Skip to content

Commit 1aa958e

Browse files
committed
feat(metrics): deep instrumentation and custom Prometheus histograms (refs #7)
1 parent 4619040 commit 1aa958e

7 files changed

Lines changed: 382 additions & 113 deletions

File tree

app/external_services/youtube_metadata.py

Lines changed: 87 additions & 47 deletions
Original file line numberDiff line numberDiff line change
@@ -63,62 +63,102 @@ async def _fetch_v3_api(
6363
) -> YouTubeMetadata:
6464
"""Fetch metadata using the official YouTube Data API v3."""
6565

66-
url = (
67-
"https://www.googleapis.com/youtube/v3/videos?part=snippet"
68-
f"&id={youtube_id}&key={api_key}"
69-
)
70-
async with httpx.AsyncClient(timeout=timeout, follow_redirects=True) as client:
71-
resp = await client.get(url)
72-
if resp.status_code != 200:
73-
raise MetadataFetchError(
74-
f"Data API returned HTTP {resp.status_code}: {resp.text[:200]}"
75-
)
76-
data = resp.json()
77-
items = data.get("items") or []
78-
if not items:
79-
raise MetadataFetchError(
80-
"Video not found or no snippet returned from Data API"
81-
)
66+
# ------------------------------------------------------------------
67+
# Observability – manual span & histogram timing
68+
# ------------------------------------------------------------------
69+
70+
from opentelemetry import trace
71+
import time
72+
from app.metrics import YOUTUBE_FETCH_DURATION_SECONDS
73+
74+
tracer = trace.get_tracer(__name__)
75+
76+
start_time = time.perf_counter()
8277

83-
snippet = items[0].get("snippet") or {}
84-
return YouTubeMetadata(
85-
title=snippet.get("title", ""),
86-
description=snippet.get("description"),
87-
thumbnail_url=snippet.get("thumbnails"), # handled by validator
88-
tags=snippet.get("tags", []),
78+
with tracer.start_as_current_span("youtube.fetch_v3_api") as span:
79+
span.set_attribute("youtube.video_id", youtube_id)
80+
81+
url = (
82+
"https://www.googleapis.com/youtube/v3/videos?part=snippet"
83+
f"&id={youtube_id}&key={api_key}"
8984
)
85+
async with httpx.AsyncClient(timeout=timeout, follow_redirects=True) as client:
86+
resp = await client.get(url)
87+
if resp.status_code != 200:
88+
raise MetadataFetchError(
89+
f"Data API returned HTTP {resp.status_code}: {resp.text[:200]}"
90+
)
91+
data = resp.json()
92+
items = data.get("items") or []
93+
if not items:
94+
raise MetadataFetchError(
95+
"Video not found or no snippet returned from Data API"
96+
)
97+
98+
snippet = items[0].get("snippet") or {}
99+
result = YouTubeMetadata(
100+
title=snippet.get("title", ""),
101+
description=snippet.get("description"),
102+
thumbnail_url=snippet.get("thumbnails"), # handled by validator
103+
tags=snippet.get("tags", []),
104+
)
105+
106+
# Record duration & size metrics
107+
duration = time.perf_counter() - start_time
108+
YOUTUBE_FETCH_DURATION_SECONDS.labels(method="v3_api").observe(duration)
109+
span.set_attribute("duration_ms", int(duration * 1000))
110+
span.set_attribute("title_length", len(result.title))
111+
112+
return result
90113

91114

92115
async def _fetch_oembed(youtube_id: str, timeout: float) -> YouTubeMetadata:
    """Fetch metadata using YouTube's public oEmbed endpoint.

    Args:
        youtube_id: The YouTube video id, interpolated into a ``youtu.be`` URL.
        timeout: Per-request timeout in seconds passed to ``httpx.AsyncClient``.

    Returns:
        A ``YouTubeMetadata`` built from the oEmbed payload. oEmbed carries no
        description or tags, so those fields are ``None`` / ``[]``.

    Raises:
        MetadataFetchError: On a non-200 response, or when the JSON payload
            lacks a ``title`` field.
    """
    # NOTE(review): these imports are function-local in the original commit;
    # they could move to module scope — kept here to avoid touching the
    # module header from this change.
    import time

    from opentelemetry import trace

    from app.metrics import YOUTUBE_FETCH_DURATION_SECONDS

    tracer = trace.get_tracer(__name__)
    start_time = time.perf_counter()

    with tracer.start_as_current_span("youtube.fetch_oembed") as span:
        span.set_attribute("youtube.video_id", youtube_id)

        url = (
            "https://www.youtube.com/oembed?format=json&url="
            f"https://youtu.be/{youtube_id}"
        )
        # Fix: dropped two leftover `print(f"DEBUG _fetch_oembed: ...")`
        # statements that wrote the request URL and the *entire* response
        # body to stdout on every call.
        async with httpx.AsyncClient(timeout=timeout, follow_redirects=True) as client:
            resp = await client.get(url)
            if resp.status_code != 200:
                # NOTE(review): error paths skip the histogram observation
                # below, so the metric records successful-fetch latency only —
                # confirm that is the intended semantics.
                raise MetadataFetchError(
                    f"oEmbed returned HTTP {resp.status_code}: {resp.text[:200]}"
                )
            data = resp.json()
            title = data.get("title")
            if not title:
                raise MetadataFetchError("oEmbed response missing title field")
            # oEmbed may omit thumbnail_url; fall back to the predictable
            # i.ytimg.com thumbnail URL for the video id.
            thumb = (
                data.get("thumbnail_url")
                or f"https://i.ytimg.com/vi/{youtube_id}/hqdefault.jpg"
            )

            result = YouTubeMetadata(
                title=title,
                description=None,  # oEmbed does not provide description
                thumbnail_url=thumb,
                tags=[],
            )

            # Record success latency on both the Prometheus histogram and the
            # active span before returning.
            duration = time.perf_counter() - start_time
            YOUTUBE_FETCH_DURATION_SECONDS.labels(method="oembed").observe(duration)
            span.set_attribute("duration_ms", int(duration * 1000))

            return result
122162

123163

124164
# ---------------------------------------------------------------------------

app/metrics.py

Lines changed: 28 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,28 @@
1+
from prometheus_client import Histogram

# ---------------------------------------------------------------------------
# Custom Prometheus metrics – exported via /metrics route exposed by
# prometheus_fastapi_instrumentator in app.utils.observability.configure_observability().
# ---------------------------------------------------------------------------

# Latency of Astra DB Data API queries, labelled by operation name.
# NOTE(review): label values are chosen by callers and are not visible here —
# keep the "operation" cardinality low.
ASTRA_DB_QUERY_DURATION_SECONDS = Histogram(
    "astra_db_query_duration_seconds",
    "Latency of Astra DB Data API queries (seconds)",
    ["operation"],
)

# Latency of YouTube metadata fetches, labelled by fetch strategy
# ("v3_api" / "oembed" in this commit's callers).
YOUTUBE_FETCH_DURATION_SECONDS = Histogram(
    "youtube_fetch_duration_seconds",
    "Latency of YouTube metadata fetches (seconds)",
    ["method"],
)

# Unlabelled histogram for semantic vector search latency.
# All histograms here use prometheus_client's default bucket boundaries.
VECTOR_SEARCH_DURATION_SECONDS = Histogram(
    "vector_search_duration_seconds",
    "Latency of semantic vector search operations (seconds)",
)

# Unlabelled histogram shared by both recommendation entry points
# (related-videos and the "For You" stub).
RECOMMENDATION_DURATION_SECONDS = Histogram(
    "recommendation_generation_duration_seconds",
    "Latency of recommendation engine stub (seconds)",
)

app/services/recommendation_service.py

Lines changed: 66 additions & 35 deletions
Original file line numberDiff line numberDiff line change
@@ -24,36 +24,51 @@ async def get_related_videos(
2424
and assign each a random relevance score.
2525
"""
2626

27-
# Ensure the referenced video exists – if it does not, we treat the request
28-
# as valid but return an empty list. The caller is free to 404 at the API
29-
# layer if it wishes to enforce existence – keeping this generic allows the
30-
# service to be reused from different contexts.
31-
target_video = await video_service.get_video_by_id(video_id)
32-
if target_video is None:
33-
return []
34-
35-
latest_summaries, _total = await video_service.list_latest_videos(
36-
page=1, page_size=limit + 5
37-
)
27+
from opentelemetry import trace
28+
import time
29+
from app.metrics import RECOMMENDATION_DURATION_SECONDS
30+
31+
tracer = trace.get_tracer(__name__)
32+
start_time = time.perf_counter()
33+
34+
with tracer.start_as_current_span("recommend.related_videos") as span:
35+
span.set_attribute("video_id", str(video_id))
36+
37+
# Ensure the referenced video exists – if it does not, we treat the request
38+
# as valid but return an empty list. The caller is free to 404 at the API
39+
# layer if it wishes to enforce existence – keeping this generic allows the
40+
# service to be reused from different contexts.
41+
target_video = await video_service.get_video_by_id(video_id)
42+
if target_video is None:
43+
return []
44+
45+
latest_summaries, _total = await video_service.list_latest_videos(
46+
page=1, page_size=limit + 5
47+
)
3848

39-
related_items: List[RecommendationItem] = []
40-
41-
for summary in latest_summaries:
42-
if summary.videoId == video_id:
43-
# Skip the source video itself
44-
continue
45-
if len(related_items) >= limit:
46-
break
47-
related_items.append(
48-
RecommendationItem(
49-
videoId=summary.videoId,
50-
title=summary.title,
51-
thumbnailUrl=summary.thumbnailUrl,
52-
score=round(random.uniform(0.5, 1.0), 2),
49+
related_items: List[RecommendationItem] = []
50+
51+
for summary in latest_summaries:
52+
if summary.videoId == video_id:
53+
# Skip the source video itself
54+
continue
55+
if len(related_items) >= limit:
56+
break
57+
related_items.append(
58+
RecommendationItem(
59+
videoId=summary.videoId,
60+
title=summary.title,
61+
thumbnailUrl=summary.thumbnailUrl,
62+
score=round(random.uniform(0.5, 1.0), 2),
63+
)
5364
)
54-
)
5565

56-
return related_items
66+
duration = time.perf_counter() - start_time
67+
RECOMMENDATION_DURATION_SECONDS.observe(duration)
68+
span.set_attribute("duration_ms", int(duration * 1000))
69+
span.set_attribute("result_count", len(related_items))
70+
71+
return related_items
5772

5873

5974
async def get_personalized_for_you_videos(
@@ -68,15 +83,31 @@ async def get_personalized_for_you_videos(
6883
recommender can be dropped-in later without further API changes.
6984
"""
7085

71-
# For visibility during development/testing.
72-
print(
73-
f"STUB: Generating 'For You' feed for user {current_user.userId} (page={page}, page_size={page_size})"
74-
)
86+
from opentelemetry import trace
87+
import time
88+
from app.metrics import RECOMMENDATION_DURATION_SECONDS
7589

76-
videos, total_items = await video_service.list_latest_videos(
77-
page=page, page_size=page_size
78-
)
79-
return videos, total_items
90+
tracer = trace.get_tracer(__name__)
91+
start_time = time.perf_counter()
92+
93+
with tracer.start_as_current_span("recommend.for_you") as span:
94+
span.set_attribute("user_id", str(current_user.userId))
95+
96+
# For visibility during development/testing.
97+
print(
98+
f"STUB: Generating 'For You' feed for user {current_user.userId} (page={page}, page_size={page_size})"
99+
)
100+
101+
videos, total_items = await video_service.list_latest_videos(
102+
page=page, page_size=page_size
103+
)
104+
105+
duration = time.perf_counter() - start_time
106+
RECOMMENDATION_DURATION_SECONDS.observe(duration)
107+
span.set_attribute("duration_ms", int(duration * 1000))
108+
span.set_attribute("result_count", total_items)
109+
110+
return videos, total_items
80111

81112

82113
# ---------------------------------------------------------------------------

app/services/vector_search_utils.py

Lines changed: 32 additions & 12 deletions
Original file line numberDiff line numberDiff line change
@@ -54,18 +54,29 @@ async def semantic_search_with_threshold(
5454
for typical thresholds around 0.7-0.9.
5555
"""
5656

57+
from opentelemetry import trace
58+
import time
59+
from app.metrics import VECTOR_SEARCH_DURATION_SECONDS
60+
61+
tracer = trace.get_tracer(__name__)
62+
5763
if page < 1 or page_size < 1:
5864
return [], 0
5965

6066
# Ask Astra for a generous slice so we can trim client-side.
6167
overfetch = page_size * overfetch_factor * page # grow with page number
6268

63-
cursor = db_table.find(
64-
filter={},
65-
sort={vector_column: query},
66-
limit=overfetch,
67-
include_similarity=True, # ⭐
68-
)
69+
start_time = time.perf_counter()
70+
71+
with tracer.start_as_current_span("vector.search") as span:
72+
span.set_attribute("query", query[:64]) # truncate long queries for span
73+
74+
cursor = db_table.find(
75+
filter={},
76+
sort={vector_column: query},
77+
limit=overfetch,
78+
include_similarity=True, # ⭐
79+
)
6980

7081
# Fetch docs.
7182
docs: List[Dict[str, Any]]
@@ -85,13 +96,22 @@ async def semantic_search_with_threshold(
8596
pre_trim = len(docs)
8697
docs = [d for d in docs if d.get("$similarity", 0) >= similarity_threshold]
8798
logger.debug(
88-
"Trimmed by threshold %.2f: %s → %s docs", similarity_threshold, pre_trim, len(docs)
99+
"Trimmed by threshold %.2f: %s → %s docs",
100+
similarity_threshold,
101+
pre_trim,
102+
len(docs),
89103
)
90104

91-
if docs:
92-
logger.debug(
93-
"Top doc similarity after trim: %.3f", docs[0].get("$similarity", -1.0)
94-
)
105+
if docs:
106+
logger.debug(
107+
"Top doc similarity after trim: %.3f", docs[0].get("$similarity", -1.0)
108+
)
109+
110+
# Record metrics
111+
duration = time.perf_counter() - start_time
112+
VECTOR_SEARCH_DURATION_SECONDS.observe(duration)
113+
span.set_attribute("duration_ms", int(duration * 1000))
114+
span.set_attribute("total_results", len(docs))
95115

96116
total = len(docs)
97117

@@ -102,4 +122,4 @@ async def semantic_search_with_threshold(
102122

103123
summaries = [VideoSummary.model_validate(d) for d in page_docs]
104124

105-
return summaries, total
125+
return summaries, total

0 commit comments

Comments
 (0)