Spaces:

vikramvasudevan
/

sanatan_ai

Running on CPU Upgrade

App Files Files Community

sanatan_ai / modules /youtube_metadata /answerer.py

vikramvasudevan

Upload folder using huggingface_hub

73a6587 verified about 2 months ago

raw

history blame contribute delete

4.05 kB

	# -------------------------------
	# 4. Answerer
	# -------------------------------
	from typing import List
	from pydantic import BaseModel
	from openai import OpenAI
	from modules.youtube_metadata.db import get_youtube_metadata_collection
	from modules.youtube_metadata.retriever import retrieve_videos


	# -------------------------------
	# Structured Output Classes
	# -------------------------------
	class VideoItem(BaseModel):
	    # One video entry inside the structured LLM answer (see LLMAnswer.top_videos).
	    # NOTE: documented with `#` comments rather than a docstring so the model's
	    # generated schema is left exactly as it was.
	    video_id: str  # interpolated into the YouTube embed URL by build_video_html
	    title: str  # shown in bold above the embedded player
	    channel: str  # shown in parentheses after the title
	    description: str  # shown in the "Description" column of the results table


	class LLMAnswer(BaseModel):
	    # Structured-output model handed to the chat completion call as
	    # `response_format`; the parsed reply is read back as an instance of it.
	    # NOTE: documented with `#` comments rather than a docstring so the model's
	    # generated schema is left exactly as it was.
	    answer_text: str  # natural-language answer to the user's question
	    top_videos: List[VideoItem]  # videos the LLM selected from the candidates


	# -------------------------------
	# Main Function
	# -------------------------------
	def answer_query(
	    query: str, top_k: int = 5, channel_id: str = None
	) -> tuple[str, str]:
	    """
	    Answer a user query using YouTube video metadata.

	    Candidate videos are fetched with ``retrieve_videos`` and passed to the
	    LLM, which returns an ``LLMAnswer`` (short text plus selected videos).

	    Args:
	        query: The user's question.
	        top_k: Number of candidates requested from the retriever.
	        channel_id: Optional channel filter forwarded to the retriever
	            (``None`` is forwarded unchanged).

	    Returns:
	        A ``(answer_text, video_html)`` tuple on every path: a Markdown
	        answer prefixed with the "Answer" heading, and the HTML produced by
	        ``build_video_html``. When nothing usable is retrieved, or the model
	        yields no parsed answer, the tuple carries an explanatory message
	        and the "no videos" HTML instead of a differently-typed value.
	    """
	    collection = get_youtube_metadata_collection()
	    results = retrieve_videos(query, collection, top_k=top_k, channel_id=channel_id)

	    if not results:
	        return _empty_answer("No relevant videos found.")

	    # Build context lines for the LLM. Non-dict entries are skipped; both
	    # spellings of the title/channel keys are accepted.
	    context_lines = []
	    for r in results:
	        if not isinstance(r, dict):
	            continue
	        vid_id = r.get("video_id", "")
	        title = r.get("video_title") or r.get("title", "")
	        channel = r.get("channel") or r.get("channel_title", "")
	        description = r.get("description", "")
	        context_lines.append(
	            f"- {title} ({channel}) (https://youtube.com/watch?v={vid_id})\n description: {description}"
	        )

	    # Every retrieved entry was unusable: skip the LLM call rather than ask
	    # it to choose from an empty candidate list.
	    if not context_lines:
	        return _empty_answer("No relevant videos found.")

	    context_text = "\n".join(context_lines)

	    # Call LLM with structured output
	    client = OpenAI()
	    response = client.chat.completions.parse(
	        model="gpt-4o-mini",
	        messages=[
	            {
	                "role": "system",
	                "content": (
	                    "You are a helpful assistant that answers questions using YouTube video metadata. "
	                    "Return your response strictly as the LLMAnswer class, including 'answer_text' and a list of only the most relevant 'top_videos'.\n"
	                    "- `answer_text` MUST be very short and concise in natural language (max 100 words).\n"
	                    "- Use `top_videos` to include only the top 3 most relevant items from context.\n"
	                    "- Do not include all items unless all are clearly relevant.\n"
	                    "- Do not makeup `description`. Use the exact descriptions as given in the context"
	                ),
	            },
	            {
	                "role": "user",
	                "content": f"Question: {query}\n\nCandidate videos:\n{context_text}\n\nPick only the relevant ones.",
	            },
	        ],
	        response_format=LLMAnswer,
	    )

	    message = response.choices[0].message
	    llm_answer = message.parsed
	    if llm_answer is None:
	        # No parsed object (e.g. the model refused): surface the refusal text
	        # when present instead of failing on attribute access below.
	        reason = getattr(message, "refusal", None)
	        return _empty_answer(reason or "The model did not return an answer.")

	    answer_text = "\n## Answer : \n" + llm_answer.answer_text
	    video_html = build_video_html(llm_answer.top_videos)
	    return answer_text, video_html


	def _empty_answer(message: str) -> tuple[str, str]:
	    """Return the (answer_text, video_html) pair used when no videos can be shown."""
	    return "\n## Answer : \n" + message, build_video_html([])


	def build_video_html(videos: list[VideoItem]) -> str:
	    """Build a clean HTML table from top_videos.

	    Each video becomes one row: its description in the first column and its
	    title, channel and an embedded YouTube player in the second.

	    Args:
	        videos: Items exposing ``video_id``, ``title``, ``channel`` and
	            ``description`` attributes.

	    Returns:
	        The table markup, or a short "no videos" paragraph when ``videos``
	        is empty. All text fields are HTML-escaped and the video id is
	        percent-encoded, so metadata or model output cannot inject markup.
	    """
	    # Function-scope imports keep this block self-contained; only the needed
	    # names are imported so nothing shadows or is shadowed by locals.
	    from html import escape
	    from urllib.parse import quote

	    if not videos:
	        return "<p>No relevant videos found.</p>"

	    parts = [
	        '<table border="1" style="border-collapse: collapse; width: 100%;">\n'
	        "<tr>\n"
	        "<th>Description</th>\n"
	        "<th>Watch</th>\n"
	        "</tr>\n"
	    ]
	    for v in videos:
	        title = escape(str(v.title))
	        channel = escape(str(v.channel))
	        description = escape(str(v.description))
	        # The id sits inside a URL in a quoted attribute: percent-encode it
	        # so quotes, spaces or angle brackets cannot break out of the src.
	        video_id = quote(str(v.video_id), safe="")
	        parts.append(
	            "<tr>\n"
	            f"<td>{description}</td>\n"
	            "<td>\n"
	            '<div style="margin-bottom: 20px;">\n'
	            f"<strong>{title}</strong> ({channel})<br>\n"
	            '<iframe width="360" height="203"\n'
	            f'src="https://www.youtube.com/embed/{video_id}"\n'
	            'frameborder="0"\n'
	            'allow="accelerometer; autoplay; clipboard-write; encrypted-media; gyroscope; picture-in-picture"\n'
	            "allowfullscreen>\n"
	            "</iframe>\n"
	            "</div>\n"
	            "</td>\n"
	            "</tr>\n"
	        )
	    parts.append("</table>")
	    # Single join instead of repeated string concatenation.
	    return "".join(parts)