Add comprehensive usage-based subscription system with API tracking

Co-authored-by: ajay.calsoft <ajay.calsoft@gmail.com>
2025-09-04 17:18:27 +00:00
parent d57f7feb4a
commit e0a6150ed1
13 changed files with 3619 additions and 10 deletions
--- a/backend/services/pricing_service.py
+++ b/backend/services/pricing_service.py
@@ -0,0 +1,433 @@
+"""
+Pricing Service for API Usage Tracking
+Manages API pricing, cost calculation, and subscription limits.
+"""
+
+from typing import Dict, Any, Optional, List, Tuple
+from decimal import Decimal, ROUND_HALF_UP
+from datetime import datetime, timedelta
+from sqlalchemy.orm import Session
+from loguru import logger
+
+from models.subscription_models import (
+    APIProviderPricing, SubscriptionPlan, UserSubscription, 
+    UsageSummary, APIUsageLog, APIProvider, SubscriptionTier
+)
+
+class PricingService:
+    """Service for managing API pricing and cost calculations."""
+    
+    def __init__(self, db: Session):
+        self.db = db
+        self._pricing_cache = {}
+        self._plans_cache = {}
+        
+    def initialize_default_pricing(self):
+        """Initialize default pricing for all API providers."""
+        
+        # Gemini API Pricing (as of January 2025)
+        gemini_pricing = [
+            {
+                "provider": APIProvider.GEMINI,
+                "model_name": "gemini-2.0-flash-lite",
+                "cost_per_input_token": 0.000000375,  # $0.075 per 1M input tokens (up to 128k context)
+                "cost_per_output_token": 0.0000003,   # $0.30 per 1M output tokens
+                "description": "Gemini 2.0 Flash Lite - Fast and efficient model"
+            },
+            {
+                "provider": APIProvider.GEMINI,
+                "model_name": "gemini-2.5-flash",
+                "cost_per_input_token": 0.000000625,  # $0.125 per 1M input tokens (up to 1M context)
+                "cost_per_output_token": 0.000000375,  # $0.375 per 1M output tokens
+                "description": "Gemini 2.5 Flash - Balanced performance and cost"
+            },
+            {
+                "provider": APIProvider.GEMINI,
+                "model_name": "gemini-2.5-pro",
+                "cost_per_input_token": 0.00000125,   # $1.25 per 1M input tokens (up to 200k context)
+                "cost_per_output_token": 0.00001,     # $10.00 per 1M output tokens
+                "description": "Gemini 2.5 Pro - Most capable model"
+            }
+        ]
+        
+        # OpenAI Pricing (estimated, will be updated)
+        openai_pricing = [
+            {
+                "provider": APIProvider.OPENAI,
+                "model_name": "gpt-4o",
+                "cost_per_input_token": 0.0000025,    # $2.50 per 1M input tokens
+                "cost_per_output_token": 0.00001,     # $10.00 per 1M output tokens
+                "description": "GPT-4o - Latest OpenAI model"
+            },
+            {
+                "provider": APIProvider.OPENAI,
+                "model_name": "gpt-4o-mini",
+                "cost_per_input_token": 0.00000015,   # $0.15 per 1M input tokens
+                "cost_per_output_token": 0.0000006,   # $0.60 per 1M output tokens
+                "description": "GPT-4o Mini - Cost-effective model"
+            }
+        ]
+        
+        # Anthropic Pricing (estimated, will be updated)
+        anthropic_pricing = [
+            {
+                "provider": APIProvider.ANTHROPIC,
+                "model_name": "claude-3.5-sonnet",
+                "cost_per_input_token": 0.000003,     # $3.00 per 1M input tokens
+                "cost_per_output_token": 0.000015,    # $15.00 per 1M output tokens
+                "description": "Claude 3.5 Sonnet - Anthropic's flagship model"
+            }
+        ]
+        
+        # Search API Pricing (estimated)
+        search_pricing = [
+            {
+                "provider": APIProvider.TAVILY,
+                "model_name": "tavily-search",
+                "cost_per_request": 0.001,  # $0.001 per search
+                "description": "Tavily AI Search API"
+            },
+            {
+                "provider": APIProvider.SERPER,
+                "model_name": "serper-search",
+                "cost_per_request": 0.001,  # $0.001 per search
+                "description": "Serper Google Search API"
+            },
+            {
+                "provider": APIProvider.METAPHOR,
+                "model_name": "metaphor-search",
+                "cost_per_request": 0.003,  # $0.003 per search
+                "description": "Metaphor/Exa AI Search API"
+            },
+            {
+                "provider": APIProvider.FIRECRAWL,
+                "model_name": "firecrawl-extract",
+                "cost_per_page": 0.002,  # $0.002 per page crawled
+                "description": "Firecrawl Web Extraction API"
+            },
+            {
+                "provider": APIProvider.STABILITY,
+                "model_name": "stable-diffusion",
+                "cost_per_image": 0.04,  # $0.04 per image
+                "description": "Stability AI Image Generation"
+            }
+        ]
+        
+        # Combine all pricing data
+        all_pricing = gemini_pricing + openai_pricing + anthropic_pricing + search_pricing
+        
+        # Insert pricing data
+        for pricing_data in all_pricing:
+            existing = self.db.query(APIProviderPricing).filter(
+                APIProviderPricing.provider == pricing_data["provider"],
+                APIProviderPricing.model_name == pricing_data["model_name"]
+            ).first()
+            
+            if not existing:
+                pricing = APIProviderPricing(**pricing_data)
+                self.db.add(pricing)
+        
+        self.db.commit()
+        logger.info("Default API pricing initialized")
+    
+    def initialize_default_plans(self):
+        """Initialize default subscription plans."""
+        
+        plans = [
+            {
+                "name": "Free",
+                "tier": SubscriptionTier.FREE,
+                "price_monthly": 0.0,
+                "price_yearly": 0.0,
+                "gemini_calls_limit": 100,
+                "openai_calls_limit": 0,
+                "anthropic_calls_limit": 0,
+                "mistral_calls_limit": 50,
+                "tavily_calls_limit": 20,
+                "serper_calls_limit": 20,
+                "metaphor_calls_limit": 10,
+                "firecrawl_calls_limit": 10,
+                "stability_calls_limit": 5,
+                "gemini_tokens_limit": 100000,
+                "monthly_cost_limit": 0.0,
+                "features": ["basic_content_generation", "limited_research"],
+                "description": "Perfect for trying out ALwrity"
+            },
+            {
+                "name": "Basic",
+                "tier": SubscriptionTier.BASIC,
+                "price_monthly": 29.0,
+                "price_yearly": 290.0,
+                "gemini_calls_limit": 1000,
+                "openai_calls_limit": 500,
+                "anthropic_calls_limit": 200,
+                "mistral_calls_limit": 500,
+                "tavily_calls_limit": 200,
+                "serper_calls_limit": 200,
+                "metaphor_calls_limit": 100,
+                "firecrawl_calls_limit": 100,
+                "stability_calls_limit": 50,
+                "gemini_tokens_limit": 1000000,
+                "openai_tokens_limit": 500000,
+                "anthropic_tokens_limit": 200000,
+                "mistral_tokens_limit": 500000,
+                "monthly_cost_limit": 50.0,
+                "features": ["full_content_generation", "advanced_research", "basic_analytics"],
+                "description": "Great for individuals and small teams"
+            },
+            {
+                "name": "Pro",
+                "tier": SubscriptionTier.PRO,
+                "price_monthly": 79.0,
+                "price_yearly": 790.0,
+                "gemini_calls_limit": 5000,
+                "openai_calls_limit": 2500,
+                "anthropic_calls_limit": 1000,
+                "mistral_calls_limit": 2500,
+                "tavily_calls_limit": 1000,
+                "serper_calls_limit": 1000,
+                "metaphor_calls_limit": 500,
+                "firecrawl_calls_limit": 500,
+                "stability_calls_limit": 200,
+                "gemini_tokens_limit": 5000000,
+                "openai_tokens_limit": 2500000,
+                "anthropic_tokens_limit": 1000000,
+                "mistral_tokens_limit": 2500000,
+                "monthly_cost_limit": 150.0,
+                "features": ["unlimited_content_generation", "premium_research", "advanced_analytics", "priority_support"],
+                "description": "Perfect for growing businesses"
+            },
+            {
+                "name": "Enterprise",
+                "tier": SubscriptionTier.ENTERPRISE,
+                "price_monthly": 199.0,
+                "price_yearly": 1990.0,
+                "gemini_calls_limit": 0,  # Unlimited
+                "openai_calls_limit": 0,
+                "anthropic_calls_limit": 0,
+                "mistral_calls_limit": 0,
+                "tavily_calls_limit": 0,
+                "serper_calls_limit": 0,
+                "metaphor_calls_limit": 0,
+                "firecrawl_calls_limit": 0,
+                "stability_calls_limit": 0,
+                "gemini_tokens_limit": 0,
+                "openai_tokens_limit": 0,
+                "anthropic_tokens_limit": 0,
+                "mistral_tokens_limit": 0,
+                "monthly_cost_limit": 500.0,
+                "features": ["unlimited_everything", "white_label", "dedicated_support", "custom_integrations"],
+                "description": "For large organizations with high-volume needs"
+            }
+        ]
+        
+        for plan_data in plans:
+            existing = self.db.query(SubscriptionPlan).filter(
+                SubscriptionPlan.name == plan_data["name"]
+            ).first()
+            
+            if not existing:
+                plan = SubscriptionPlan(**plan_data)
+                self.db.add(plan)
+        
+        self.db.commit()
+        logger.info("Default subscription plans initialized")
+    
+    def calculate_api_cost(self, provider: APIProvider, model_name: str, 
+                          tokens_input: int = 0, tokens_output: int = 0, 
+                          request_count: int = 1, **kwargs) -> Dict[str, float]:
+        """Calculate cost for an API call."""
+        
+        # Get pricing for the provider and model
+        pricing = self.db.query(APIProviderPricing).filter(
+            APIProviderPricing.provider == provider,
+            APIProviderPricing.model_name == model_name,
+            APIProviderPricing.is_active == True
+        ).first()
+        
+        if not pricing:
+            logger.warning(f"No pricing found for {provider.value}:{model_name}, using default estimates")
+            # Use default estimates
+            cost_input = tokens_input * 0.000001  # $1 per 1M tokens default
+            cost_output = tokens_output * 0.000001
+            cost_total = (cost_input + cost_output) * request_count
+        else:
+            # Calculate based on actual pricing
+            cost_input = tokens_input * pricing.cost_per_input_token
+            cost_output = tokens_output * pricing.cost_per_output_token
+            cost_request = request_count * pricing.cost_per_request
+            
+            # Handle special cases for non-LLM APIs
+            cost_search = kwargs.get('search_count', 0) * pricing.cost_per_search
+            cost_image = kwargs.get('image_count', 0) * pricing.cost_per_image
+            cost_page = kwargs.get('page_count', 0) * pricing.cost_per_page
+            
+            cost_total = cost_input + cost_output + cost_request + cost_search + cost_image + cost_page
+        
+        # Round to 6 decimal places for precision
+        return {
+            'cost_input': round(cost_input, 6),
+            'cost_output': round(cost_output, 6),
+            'cost_total': round(cost_total, 6)
+        }
+    
+    def get_user_limits(self, user_id: str) -> Optional[Dict[str, Any]]:
+        """Get usage limits for a user based on their subscription."""
+        
+        subscription = self.db.query(UserSubscription).filter(
+            UserSubscription.user_id == user_id,
+            UserSubscription.is_active == True
+        ).first()
+        
+        if not subscription:
+            # Return free tier limits
+            free_plan = self.db.query(SubscriptionPlan).filter(
+                SubscriptionPlan.tier == SubscriptionTier.FREE
+            ).first()
+            if free_plan:
+                return self._plan_to_limits_dict(free_plan)
+            return None
+        
+        return self._plan_to_limits_dict(subscription.plan)
+    
+    def _plan_to_limits_dict(self, plan: SubscriptionPlan) -> Dict[str, Any]:
+        """Convert subscription plan to limits dictionary."""
+        return {
+            'plan_name': plan.name,
+            'tier': plan.tier.value,
+            'limits': {
+                'gemini_calls': plan.gemini_calls_limit,
+                'openai_calls': plan.openai_calls_limit,
+                'anthropic_calls': plan.anthropic_calls_limit,
+                'mistral_calls': plan.mistral_calls_limit,
+                'tavily_calls': plan.tavily_calls_limit,
+                'serper_calls': plan.serper_calls_limit,
+                'metaphor_calls': plan.metaphor_calls_limit,
+                'firecrawl_calls': plan.firecrawl_calls_limit,
+                'stability_calls': plan.stability_calls_limit,
+                'gemini_tokens': plan.gemini_tokens_limit,
+                'openai_tokens': plan.openai_tokens_limit,
+                'anthropic_tokens': plan.anthropic_tokens_limit,
+                'mistral_tokens': plan.mistral_tokens_limit,
+                'monthly_cost': plan.monthly_cost_limit
+            },
+            'features': plan.features or []
+        }
+    
+    def check_usage_limits(self, user_id: str, provider: APIProvider, 
+                          tokens_requested: int = 0) -> Tuple[bool, str, Dict[str, Any]]:
+        """Check if user can make an API call within their limits."""
+        
+        # Get user limits
+        limits = self.get_user_limits(user_id)
+        if not limits:
+            return False, "No subscription plan found", {}
+        
+        # Get current usage for this billing period
+        current_period = datetime.now().strftime("%Y-%m")
+        usage = self.db.query(UsageSummary).filter(
+            UsageSummary.user_id == user_id,
+            UsageSummary.billing_period == current_period
+        ).first()
+        
+        if not usage:
+            # First usage this period, create summary
+            usage = UsageSummary(
+                user_id=user_id,
+                billing_period=current_period
+            )
+            self.db.add(usage)
+            self.db.commit()
+        
+        # Check call limits
+        provider_name = provider.value
+        current_calls = getattr(usage, f"{provider_name}_calls", 0)
+        call_limit = limits['limits'].get(f"{provider_name}_calls", 0)
+        
+        if call_limit > 0 and current_calls >= call_limit:
+            return False, f"API call limit reached for {provider_name}", {
+                'current_calls': current_calls,
+                'limit': call_limit,
+                'usage_percentage': 100.0
+            }
+        
+        # Check token limits for LLM providers
+        if provider in [APIProvider.GEMINI, APIProvider.OPENAI, APIProvider.ANTHROPIC, APIProvider.MISTRAL]:
+            current_tokens = getattr(usage, f"{provider_name}_tokens", 0)
+            token_limit = limits['limits'].get(f"{provider_name}_tokens", 0)
+            
+            if token_limit > 0 and (current_tokens + tokens_requested) > token_limit:
+                return False, f"Token limit would be exceeded for {provider_name}", {
+                    'current_tokens': current_tokens,
+                    'requested_tokens': tokens_requested,
+                    'limit': token_limit,
+                    'usage_percentage': ((current_tokens + tokens_requested) / token_limit) * 100
+                }
+        
+        # Check cost limits
+        cost_limit = limits['limits'].get('monthly_cost', 0)
+        if cost_limit > 0 and usage.total_cost >= cost_limit:
+            return False, "Monthly cost limit reached", {
+                'current_cost': usage.total_cost,
+                'limit': cost_limit,
+                'usage_percentage': 100.0
+            }
+        
+        # Calculate usage percentages for warnings
+        call_usage_pct = (current_calls / max(call_limit, 1)) * 100 if call_limit > 0 else 0
+        cost_usage_pct = (usage.total_cost / max(cost_limit, 1)) * 100 if cost_limit > 0 else 0
+        
+        return True, "Within limits", {
+            'current_calls': current_calls,
+            'call_limit': call_limit,
+            'call_usage_percentage': call_usage_pct,
+            'current_cost': usage.total_cost,
+            'cost_limit': cost_limit,
+            'cost_usage_percentage': cost_usage_pct
+        }
+    
+    def estimate_tokens(self, text: str, provider: APIProvider) -> int:
+        """Estimate token count for text based on provider."""
+        
+        # Get pricing info for token estimation
+        pricing = self.db.query(APIProviderPricing).filter(
+            APIProviderPricing.provider == provider,
+            APIProviderPricing.is_active == True
+        ).first()
+        
+        if pricing and pricing.tokens_per_word:
+            # Use provider-specific conversion
+            word_count = len(text.split())
+            return int(word_count * pricing.tokens_per_word)
+        else:
+            # Use default estimation (roughly 1.3 tokens per word for most models)
+            word_count = len(text.split())
+            return int(word_count * 1.3)
+    
+    def get_pricing_info(self, provider: APIProvider, model_name: str = None) -> Optional[Dict[str, Any]]:
+        """Get pricing information for a provider/model."""
+        
+        query = self.db.query(APIProviderPricing).filter(
+            APIProviderPricing.provider == provider,
+            APIProviderPricing.is_active == True
+        )
+        
+        if model_name:
+            query = query.filter(APIProviderPricing.model_name == model_name)
+        
+        pricing = query.first()
+        
+        if not pricing:
+            return None
+        
+        return {
+            'provider': pricing.provider.value,
+            'model_name': pricing.model_name,
+            'cost_per_input_token': pricing.cost_per_input_token,
+            'cost_per_output_token': pricing.cost_per_output_token,
+            'cost_per_request': pricing.cost_per_request,
+            'cost_per_search': pricing.cost_per_search,
+            'cost_per_image': pricing.cost_per_image,
+            'cost_per_page': pricing.cost_per_page,
+            'description': pricing.description
+        }