Spaces:

vikramvasudevan
/

youtube-channel-surfer-ai

Running

App Files Files Community

youtube-channel-surfer-ai / modules /answerer.py

vikramvasudevan

Upload folder using huggingface_hub

b36dab2 verified about 1 month ago

raw

history blame

3.76 kB

	# -------------------------------
	# 4. Answerer
	# -------------------------------
	from typing import List
	from pydantic import BaseModel
	from openai import OpenAI
	from modules.retriever import retrieve_videos


	# -------------------------------
	# Structured Output Classes
	# -------------------------------
	class VideoItem(BaseModel):
	video_id: str
	title: str
	channel: str
	description: str


	class LLMAnswer(BaseModel):
	answer_text: str
	top_videos: List[VideoItem]


	# -------------------------------
	# Main Function
	# -------------------------------
	def answer_query(query: str, collection, top_k: int = 5) -> LLMAnswer:
	"""
	Answer a user query using YouTube video metadata.
	Returns an LLMAnswer object with textual answer + list of videos.
	"""
	results = retrieve_videos(query, collection, top_k=top_k)

	if not results:
	return LLMAnswer(answer_text="No relevant videos found.", top_videos=[])

	# Build context lines for the LLM
	context_lines = []
	for r in results:
	if not isinstance(r, dict):
	continue
	vid_id = r.get("video_id", "")
	title = r.get("video_title") or r.get("title", "")
	channel = r.get("channel") or r.get("channel_title", "")
	description = r.get("description", "")
	context_lines.append(
	f"- {title} ({channel}) (https://youtube.com/watch?v={vid_id})\n description: {description}"
	)

	context_text = "\n".join(context_lines)

	# Call LLM with structured output
	client = OpenAI()
	response = client.chat.completions.parse(
	model="gpt-4o-mini",
	messages=[
	{
	"role": "system",
	"content": (
	"You are a helpful assistant that answers questions using YouTube video metadata. "
	"Return your response strictly as the LLMAnswer class, including 'answer_text' and a list of only the most relevant 'top_videos'.\n"
	"- `answer_text` MUST be very short and concise in natural language (max 1–2 sentences).\n"
	"- Use `top_videos` to include only the 2–3 most relevant items from context.\n"
	"- Do not include all items unless all are clearly relevant.\n"
	),
	},
	{
	"role": "user",
	"content": f"Question: {query}\n\nCandidate videos:\n{context_text}\n\nPick only the relevant ones.",
	},
	],
	response_format=LLMAnswer,
	)

	llm_answer = response.choices[0].message.parsed
	answer_text = llm_answer.answer_text
	video_html = build_video_html(llm_answer.top_videos)
	return answer_text, video_html



	def build_video_html(videos: list[VideoItem]) -> str:
	"""Build a clean HTML table from top_videos."""
	if not videos:
	return "<p>No relevant videos found.</p>"

	html = """
	<table border="1" style="border-collapse: collapse; width: 100%;">
	<tr>
	<th>Description</th>
	<th>Watch</th>
	</tr>
	"""
	for v in videos:
	embed_html = f"""
	<div style="margin-bottom: 20px;">
	<strong>{v.title}</strong> ({v.channel})<br>
	<iframe width="360" height="203"
	src="https://www.youtube.com/embed/{v.video_id}"
	frameborder="0"
	allow="accelerometer; autoplay; clipboard-write; encrypted-media; gyroscope; picture-in-picture"
	allowfullscreen>
	</iframe>
	</div>
	"""
	html += f"""
	<tr>
	<td>{v.description}</td>
	<td>{embed_html}</td>
	</tr>
	"""
	html += "</table>"
	return html