openevidence-cost-tuning

Optimize OpenEvidence API costs and usage efficiency. Use when reducing API costs, implementing usage budgets, or optimizing DeepConsult spend for clinical AI applications. Trigger with phrases like "openevidence cost", "openevidence billing", "reduce openevidence spend", "openevidence budget", "openevidence pricing". allowed-tools: Read, Write, Edit version: 1.0.0 license: MIT author: Jeremy Longshore <jeremy@intentsolutions.io>

v1.0.0

Jeremy Longshore

MIT

Allowed Tools

No tools specified

Provided by Plugin

openevidence-pack

Claude Code skill pack for OpenEvidence medical AI (24 skills)

saas packs v1.0.0

View Plugin

Installation

This skill is included in the openevidence-pack plugin:

/plugin install openevidence-pack@claude-code-plugins-plus

Click to copy

Instructions

# OpenEvidence Cost Tuning ## Overview Optimize OpenEvidence API costs while maintaining clinical decision support quality. ## Prerequisites - OpenEvidence billing dashboard access - Usage metrics configured - Understanding of pricing model - Budget authority ## Pricing Model Overview | Feature | Unit | Typical Cost | |---------|------|--------------| | Clinical Query | Per query | Included in subscription | | DeepConsult | Per research synthesis | Premium (100x query cost) | | API Overage | Per 1000 queries over limit | Tier-dependent | | Enterprise Features | Monthly | Custom pricing | ## Instructions ### Step 1: Usage Tracking & Budgeting ```typescript // src/cost/usage-tracker.ts interface UsageBudget { dailyQueryLimit: number; dailyDeepConsultLimit: number; monthlyBudget: number; alertThreshold: number; // 0-1 } interface UsageRecord { queries: number; deepConsults: number; estimatedCost: number; period: 'daily' | 'monthly'; } export class UsageTracker { private redis: Redis; private budget: UsageBudget; private costPerQuery = 0; // Included in subscription private costPerDeepConsult = 10; // Example - check actual pricing constructor(redis: Redis, budget: UsageBudget) { this.redis = redis; this.budget = budget; } async trackQuery(userId: string): Promise { const today = new Date().toISOString().split('T')[0]; const month = today.substring(0, 7); await this.redis.hincrby(`usage:daily:${today}`, 'queries', 1); await this.redis.hincrby(`usage:daily:${today}`, `user:${userId}:queries`, 1); await this.redis.hincrby(`usage:monthly:${month}`, 'queries', 1); await this.checkBudgetAlerts(today, month); } async trackDeepConsult(userId: string): Promise { const today = new Date().toISOString().split('T')[0]; const month = today.substring(0, 7); await this.redis.hincrby(`usage:daily:${today}`, 'deepConsults', 1); await this.redis.hincrby(`usage:daily:${today}`, `user:${userId}:deepConsults`, 1); await this.redis.hincrby(`usage:monthly:${month}`, 'deepConsults', 1); await this.checkBudgetAlerts(today, month); } async canMakeQuery(): Promise<{ allowed: boolean; reason?: string }> { const today = new Date().toISOString().split('T')[0]; const dailyQueries = parseInt( await this.redis.hget(`usage:daily:${today}`, 'queries') || '0' ); if (dailyQueries >= this.budget.dailyQueryLimit) { return { allowed: false, reason: `Daily query limit (${this.budget.dailyQueryLimit}) reached`, }; } return { allowed: true }; } async canRunDeepConsult(): Promise<{ allowed: boolean; reason?: string }> { const today = new Date().toISOString().split('T')[0]; const dailyDeepConsults = parseInt( await this.redis.hget(`usage:daily:${today}`, 'deepConsults') || '0' ); if (dailyDeepConsults >= this.budget.dailyDeepConsultLimit) { return { allowed: false, reason: `Daily DeepConsult limit (${this.budget.dailyDeepConsultLimit}) reached`, }; } // Check monthly budget const month = today.substring(0, 7); const monthlyUsage = await this.getMonthlyUsage(month); if (monthlyUsage.estimatedCost >= this.budget.monthlyBudget) { return { allowed: false, reason: `Monthly budget ($${this.budget.monthlyBudget}) reached`, }; } return { allowed: true }; } async getMonthlyUsage(month: string): Promise { const queries = parseInt( await this.redis.hget(`usage:monthly:${month}`, 'queries') || '0' ); const deepConsults = parseInt( await this.redis.hget(`usage:monthly:${month}`, 'deepConsults') || '0' ); return { queries, deepConsults, estimatedCost: queries * this.costPerQuery + deepConsults * this.costPerDeepConsult, period: 'monthly', }; } private async checkBudgetAlerts(today: string, month: string): Promise { const monthlyUsage = await this.getMonthlyUsage(month); const usagePercent = monthlyUsage.estimatedCost / this.budget.monthlyBudget; if (usagePercent >= this.budget.alertThreshold) { await this.sendBudgetAlert(usagePercent, monthlyUsage); } } private async sendBudgetAlert(percent: number, usage: UsageRecord): Promise { // Send alert to admins console.warn(`[Budget Alert] ${(percent * 100).toFixed(0)}% of monthly budget used`); // Implement notification service call here } } ``` ### Step 2: Smart DeepConsult Management ```typescript // src/cost/deepconsult-optimizer.ts // DeepConsult costs 100x+ more than regular queries interface DeepConsultDecision { shouldUseDeepConsult: boolean; reason: string; alternativeApproach?: string; } export function shouldUseDeepConsult( question: string, context: ClinicalContext, userTier: 'free' | 'professional' | 'enterprise' ): DeepConsultDecision { // Never use DeepConsult for simple questions const simplePatterns = [ /what is the (dose|dosage)/i, /half-life of/i, /contraindications for/i, /side effects of/i, ]; if (simplePatterns.some(p => p.test(question))) { return { shouldUseDeepConsult: false, reason: 'Simple question - regular query sufficient', alternativeApproach: 'Use standard clinical query', }; } // DeepConsult good for complex research const complexPatterns = [ /compare.*treatments?/i, /systematic review/i, /evidence (for|against)/i, /recent advances/i, /emerging therapies/i, ]; if (complexPatterns.some(p => p.test(question))) { if (userTier === 'free') { return { shouldUseDeepConsult: false, reason: 'DeepConsult not available for free tier', alternativeApproach: 'Upgrade to Professional or run multiple targeted queries', }; } return { shouldUseDeepConsult: true, reason: 'Complex research question benefits from DeepConsult', }; } return { shouldUseDeepConsult: false, reason: 'Standard clinical query recommended', alternativeApproach: 'Try regular query first, escalate if insufficient', }; } // Cache DeepConsult results aggressively const DEEPCONSULT_CACHE_TTL = 7 * 24 * 60 * 60; // 1 week export async function getCachedOrRunDeepConsult( question: string, context: ClinicalContext, cache: ClinicalQueryCache ): Promise { // Check for similar cached reports const cacheKey = `deepconsult:${hashQuestion(question, context)}`; const cached = await cache.get(cacheKey); if (cached) { console.log('[Cost] Using cached DeepConsult report'); return cached; } return null; // Caller should run DeepConsult and cache result } ``` ### Step 3: User Quotas & Tiering ```typescript // src/cost/user-quotas.ts interface UserQuota { dailyQueries: number; monthlyQueries: number; deepConsultsPerMonth: number; features: string[]; } const USER_TIERS: Record = { free: { dailyQueries: 10, monthlyQueries: 100, deepConsultsPerMonth: 0, features: ['clinical_query'], }, professional: { dailyQueries: 100, monthlyQueries: 2000, deepConsultsPerMonth: 10, features: ['clinical_query', 'deepconsult', 'guidelines'], }, enterprise: { dailyQueries: 1000, monthlyQueries: 30000, deepConsultsPerMonth: 100, features: ['clinical_query', 'deepconsult', 'guidelines', 'api_access', 'ehr_integration'], }, }; export class UserQuotaManager { async checkQuota(userId: string, feature: string): Promise<{ allowed: boolean; remaining?: number; upgradeMessage?: string; }> { const user = await db.users.findUnique({ where: { id: userId } }); const tier = user?.tier || 'free'; const quota = USER_TIERS[tier]; if (!quota.features.includes(feature)) { return { allowed: false, upgradeMessage: `${feature} requires Professional tier or higher`, }; } const usage = await this.getUserUsage(userId); if (feature === 'clinical_query') { const remaining = quota.dailyQueries - usage.dailyQueries; return { allowed: remaining > 0, remaining, upgradeMessage: remaining <= 0 ? 'Daily query limit reached. Upgrade for more.' : undefined, }; } if (feature === 'deepconsult') { const remaining = quota.deepConsultsPerMonth - usage.monthlyDeepConsults; return { allowed: remaining > 0, remaining, upgradeMessage: remaining <= 0 ? 'Monthly DeepConsult limit reached. Contact sales.' : undefined, }; } return { allowed: true }; } private async getUserUsage(userId: string): Promise { // Implementation to get user's current usage return { dailyQueries: 0, monthlyDeepConsults: 0 }; } } ``` ### Step 4: Cost Reporting Dashboard ```typescript // src/cost/reporting.ts export async function generateCostReport( startDate: Date, endDate: Date ): Promise { // Aggregate usage data const usage = await aggregateUsage(startDate, endDate); const report: CostReport = { period: { start: startDate, end: endDate }, summary: { totalQueries: usage.queries, totalDeepConsults: usage.deepConsults, estimatedCost: calculateCost(usage), costPerQuery: usage.queries > 0 ? calculateCost(usage) / usage.queries : 0, }, breakdown: { bySpecialty: usage.bySpecialty, byUser: usage.byUser, byDay: usage.byDay, }, recommendations: generateRecommendations(usage), }; return report; } function generateRecommendations(usage: any): string[] { const recommendations: string[] = []; // Check for high DeepConsult usage if (usage.deepConsults > usage.queries * 0.1) { recommendations.push( 'DeepConsult usage is high. Consider caching results or using regular queries for simpler questions.' ); } // Check for low cache hit rate if (usage.cacheHitRate < 0.5) { recommendations.push( 'Cache hit rate is low. Review caching strategy and TTL settings.' ); } // Check for concentrated usage const topUser = Object.entries(usage.byUser) .sort((a, b) => (b[1] as number) - (a[1] as number))[0]; if (topUser && (topUser[1] as number) > usage.queries * 0.5) { recommendations.push( `User ${topUser[0]} accounts for over 50% of usage. Review for potential optimization.` ); } return recommendations; } ``` ## Cost Optimization Checklist - [ ] Usage tracking enabled - [ ] Daily/monthly budgets set - [ ] Alert thresholds configured - [ ] DeepConsult decision logic in place - [ ] User quotas implemented - [ ] Caching maximized - [ ] Cost reports automated ## Output - Usage tracking and budgeting system - Smart DeepConsult management - User quota enforcement - Cost reporting dashboard - Optimization recommendations ## Error Handling | Cost Issue | Detection | Resolution | |------------|-----------|------------| | Budget exceeded | Alert triggered | Implement throttling or upgrade | | High DeepConsult costs | Monthly report | Review usage patterns, improve caching | | Low cache efficiency | Metrics show low hits | Adjust TTL, increase cache size | | User abuse | Usage concentration | Implement per-user quotas | ## Resources - [OpenEvidence Pricing](https://www.openevidence.com/pricing) - [OpenEvidence API Terms](https://www.openevidence.com/policies/api) ## Next Steps For architecture best practices, see `openevidence-reference-architecture`.