""" Bing Webmaster Tools Analytics Handler Handles Bing Webmaster Tools analytics data retrieval and processing. """ from typing import Dict, Any from datetime import datetime, timedelta from loguru import logger from services.integrations.bing_oauth import BingOAuthService from ...analytics_cache_service import analytics_cache from ..models.analytics_data import AnalyticsData from ..models.platform_types import PlatformType from .base_handler import BaseAnalyticsHandler from ..insights.bing_insights_service import BingInsightsService from services.bing_analytics_storage_service import BingAnalyticsStorageService from services.database import get_user_db_path class BingAnalyticsHandler(BaseAnalyticsHandler): """ Handler for Bing Webmaster Tools analytics NOTE (2026-02-14): Known issues and directions - Verified sites list can be empty despite valid tokens. This leads to partial/error states and prevents storage collection. Direction: UI now provides a manual site picker (with primary website fallback from onboarding) to trigger storage collection, and a future improvement should accept a target_url from /api/analytics/data to influence site selection here. - Token state mismatch (status shows connected, analytics reports expired) can happen across cache boundaries. Direction: The frontend auto-resyncs once after OAuth success and provides a backend cache clear endpoint. - Storage-backed summary reads rely on a selected site; when sites are missing, selected_site is None. Direction: Allow explicit site_url parameter in the analytics orchestrator to override selected_site resolution. """ def __init__(self): super().__init__(PlatformType.BING) self.bing_service = BingOAuthService() def _get_storage_service(self, user_id: str) -> BingAnalyticsStorageService: """Get user-specific storage service.""" db_path = get_user_db_path(user_id) db_url = f'sqlite:///{db_path}' return BingAnalyticsStorageService(db_url) def _get_insights_service(self, user_id: str) -> BingInsightsService: """Get user-specific insights service.""" # For now, insights might be in a separate DB or same. # User requested isolation, so same user DB is best. db_path = get_user_db_path(user_id) db_url = f'sqlite:///{db_path}' return BingInsightsService(db_url) async def get_analytics(self, user_id: str, target_url: str = None, start_date: str = None, end_date: str = None, **kwargs) -> AnalyticsData: """ Get Bing Webmaster analytics data using Bing Webmaster API """ self.log_analytics_request(user_id, "get_analytics") # Check cache first (include date range and target_url in key) cache_key_parts = [user_id] if target_url: cache_key_parts.append(str(target_url)) if start_date: cache_key_parts.append(str(start_date)) if end_date: cache_key_parts.append(str(end_date)) cache_key = "_".join(cache_key_parts) cached_data = analytics_cache.get('bing_analytics', cache_key) if cached_data: logger.info(f"Using cached Bing analytics for user {user_id}") return AnalyticsData(**cached_data) logger.info(f"Fetching fresh Bing analytics for user {user_id}") try: # Get services for this user storage_service = self._get_storage_service(user_id) insights_service = self._get_insights_service(user_id) # Get user's Bing connection status token_status = self.bing_service.get_user_token_status(user_id) if not token_status.get('has_active_tokens'): if token_status.get('has_expired_tokens'): return self.create_error_response('Bing Webmaster tokens expired - please reconnect') else: return self.create_error_response('Bing Webmaster not connected') sites = self.bing_service.get_user_sites(user_id) active_tokens = token_status.get('active_tokens', []) if not active_tokens: return self.create_error_response('No active Bing Webmaster tokens available') token_info = active_tokens[0] access_token = token_info.get('access_token') analytics_cache.set('bing_sites', user_id, sites or [], ttl_override=2*60*60) if not access_token: return self.create_error_response('Bing Webmaster access token not available') # Select site: Prefer target_url match, otherwise first site selected_site = sites[0] if sites else None if not selected_site: return self.create_error_response('No Bing sites found') if target_url and sites: logger.info(f"Attempting to match target URL: {target_url}") # Normalize target URL (remove protocol, trailing slash) normalized_target = target_url.replace('https://', '').replace('http://', '').rstrip('/') for site in sites: # Bing uses 'Url' key site_url = site.get('Url', '') normalized_site = site_url.replace('https://', '').replace('http://', '').rstrip('/') if normalized_target in normalized_site or normalized_site in normalized_target: selected_site = site logger.info(f"Found matching Bing site: {site_url}") break site_url_for_storage = selected_site.get('Url', '') if selected_site else '' logger.info(f"Using Bing site URL: {site_url_for_storage}") # Determine date range (defaults to last 30 days) if not end_date: end_date = datetime.now().strftime('%Y-%m-%d') if not start_date: start_date = (datetime.now() - timedelta(days=30)).strftime('%Y-%m-%d') # Compute days for storage/insights services (at least 1) try: dt_end = datetime.strptime(end_date, '%Y-%m-%d') dt_start = datetime.strptime(start_date, '%Y-%m-%d') days_range = max(1, (dt_end - dt_start).days + 1) except Exception: days_range = 30 query_stats = {} try: stored = storage_service.get_analytics_summary(user_id, site_url_for_storage, days=days_range) if stored and isinstance(stored, dict): query_stats = { 'total_clicks': stored.get('summary', {}).get('total_clicks', 0), 'total_impressions': stored.get('summary', {}).get('total_impressions', 0), 'total_queries': stored.get('summary', {}).get('total_queries', 0), 'avg_ctr': stored.get('summary', {}).get('total_ctr', 0), 'avg_position': stored.get('summary', {}).get('avg_position', 0), } except Exception as e: logger.warning(f"Bing analytics: Failed to read stored analytics summary: {e}") # Get enhanced insights insights = self._get_enhanced_insights_with_service(insights_service, user_id, site_url_for_storage) metrics = { 'connection_status': 'connected', 'connected_sites': len(sites), 'sites': sites[:5] if sites else [], 'connected_since': token_info.get('created_at', ''), 'scope': token_info.get('scope', ''), 'total_clicks': query_stats.get('total_clicks', 0), 'total_impressions': query_stats.get('total_impressions', 0), 'total_queries': query_stats.get('total_queries', 0), 'avg_ctr': query_stats.get('avg_ctr', 0), 'avg_position': query_stats.get('avg_position', 0), 'insights': insights, 'note': 'Bing Webmaster API provides SEO insights, search performance, and index status data' } if not sites: result = self.create_partial_response(metrics=metrics, error_message='Connected to Bing; no verified sites found') else: result = self.create_success_response(metrics=metrics, date_range={'start': start_date, 'end': end_date}) analytics_cache.set('bing_analytics', cache_key, result.__dict__) return result except Exception as e: self.log_analytics_error(user_id, "get_analytics", e) error_result = self.create_error_response(str(e)) # Cache error briefly to prevent hammering but recover quickly analytics_cache.set('bing_analytics', cache_key, error_result.__dict__, ttl_override=30) return error_result def _get_enhanced_insights_with_service(self, insights_service: BingInsightsService, user_id: str, site_url: str) -> Dict[str, Any]: """Get enhanced insights using provided service.""" try: if not site_url: return {'status': 'no_site_url', 'message': 'No site URL available for insights'} performance_insights = insights_service.get_performance_insights(user_id, site_url, days=30) seo_insights = insights_service.get_seo_insights(user_id, site_url, days=30) recommendations = insights_service.get_actionable_recommendations(user_id, site_url, days=30) return { 'performance': performance_insights, 'seo': seo_insights, 'recommendations': recommendations, 'last_analyzed': datetime.now().isoformat() } except Exception as e: logger.warning(f"Error getting enhanced insights: {e}") return {'status': 'error', 'message': str(e)} def get_connection_status(self, user_id: str) -> Dict[str, Any]: """Get Bing Webmaster connection status""" self.log_analytics_request(user_id, "get_connection_status") try: bing_connection = self.bing_service.get_connection_status(user_id) return { 'connected': bing_connection.get('connected', False), 'sites_count': bing_connection.get('total_sites', 0), 'sites': bing_connection.get('sites', []), 'error': None } except Exception as e: self.log_analytics_error(user_id, "get_connection_status", e) return { 'connected': False, 'sites_count': 0, 'sites': [], 'error': str(e) } def _extract_user_sites(self, sites_data: Any) -> list: """Extract user sites from Bing API response""" if isinstance(sites_data, dict): if 'd' in sites_data: d_data = sites_data['d'] if isinstance(d_data, dict) and 'results' in d_data: return d_data['results'] elif isinstance(d_data, list): return d_data else: return [] else: return [] elif isinstance(sites_data, list): return sites_data else: return [] async def _get_query_stats(self, user_id: str, sites: list) -> Dict[str, Any]: """Get query statistics for Bing sites""" query_stats = {} logger.info(f"Bing sites found: {len(sites)} sites") if sites: first_site = sites[0] logger.info(f"First Bing site: {first_site}") # Bing API returns URL in 'Url' field (capital U) site_url = first_site.get('Url', '') if isinstance(first_site, dict) else str(first_site) logger.info(f"Extracted site URL: {site_url}") if site_url: try: # Use the Bing service method to get query stats logger.info(f"Getting Bing query stats for site: {site_url}") query_data = self.bing_service.get_query_stats( user_id=user_id, site_url=site_url, start_date=(datetime.now() - timedelta(days=30)).strftime('%Y-%m-%d'), end_date=datetime.now().strftime('%Y-%m-%d'), page=0 ) if "error" not in query_data: logger.info(f"Bing query stats response structure: {type(query_data)}, keys: {list(query_data.keys()) if isinstance(query_data, dict) else 'Not a dict'}") logger.info(f"Bing query stats raw response: {query_data}") # Handle different response structures from Bing API queries = self._extract_queries(query_data) logger.info(f"Bing queries extracted: {len(queries)} queries") if queries and len(queries) > 0: logger.info(f"First query sample: {queries[0] if isinstance(queries[0], dict) else queries[0]}") # Calculate summary metrics total_clicks = sum(query.get('Clicks', 0) for query in queries if isinstance(query, dict)) total_impressions = sum(query.get('Impressions', 0) for query in queries if isinstance(query, dict)) total_queries = len(queries) avg_ctr = (total_clicks / total_impressions * 100) if total_impressions > 0 else 0 avg_position = sum(query.get('AvgClickPosition', 0) for query in queries if isinstance(query, dict)) / total_queries if total_queries > 0 else 0 query_stats = { 'total_clicks': total_clicks, 'total_impressions': total_impressions, 'total_queries': total_queries, 'avg_ctr': round(avg_ctr, 2), 'avg_position': round(avg_position, 2) } logger.info(f"Bing query stats calculated: {query_stats}") else: logger.warning(f"Bing query stats error: {query_data['error']}") except Exception as e: logger.warning(f"Error getting Bing query stats: {e}") return query_stats def _extract_queries(self, query_data: Any) -> list: """Extract queries from Bing API response""" if isinstance(query_data, dict): if 'd' in query_data: d_data = query_data['d'] logger.info(f"Bing 'd' data structure: {type(d_data)}, keys: {list(d_data.keys()) if isinstance(d_data, dict) else 'Not a dict'}") if isinstance(d_data, dict) and 'results' in d_data: return d_data['results'] elif isinstance(d_data, list): return d_data else: return [] else: return [] elif isinstance(query_data, list): return query_data else: return [] def _get_enhanced_insights(self, user_id: str, site_url: str) -> Dict[str, Any]: """Get enhanced insights from stored Bing analytics data""" try: if not site_url: return {'status': 'no_site_url', 'message': 'No site URL available for insights'} # Get performance insights performance_insights = self.insights_service.get_performance_insights(user_id, site_url, days=30) # Get SEO insights seo_insights = self.insights_service.get_seo_insights(user_id, site_url, days=30) # Get actionable recommendations recommendations = self.insights_service.get_actionable_recommendations(user_id, site_url, days=30) return { 'performance': performance_insights, 'seo': seo_insights, 'recommendations': recommendations, 'last_analyzed': datetime.now().isoformat() } except Exception as e: logger.warning(f"Error getting enhanced insights: {e}") return { 'status': 'error', 'message': f'Unable to generate insights: {str(e)}', 'fallback': True }