Final_Assignment_Template

Sleeping

App Files Files Community

Final_Assignment_Template / agent.py

janjibDEV

50% on GAIA benchmark

bd1c4e8 12 months ago

Raw

History Blame

5.31 kB

	from smolagents import CodeAgent, LiteLLMModel, DuckDuckGoSearchTool, PythonInterpreterTool, FinalAnswerTool, VisitWebpageTool, tool
	import os
	import wikipediaapi
	from youtubesearchpython import VideosSearch
	from youtube_transcript_api import YouTubeTranscriptApi, NoTranscriptFound, TranscriptsDisabled
	import pandas as pd

	wiki_api = wikipediaapi.Wikipedia(
	language='en',
	user_agent="MyAgent/1.0 (contact@example.com)"
	)

	@tool
	def search_youtube_video(query: str) -> str:
	"""
	Searches YouTube and returns the title and URL of the top result.

	Args:
	query (str): The search term to look up on YouTube.

	Returns:
	str: The title and URL of the top video result.

	"""
	print(f"--- Executing Youtube with query: '{query}' ---")
	try:
	search = VideosSearch(query, limit=1)
	top_result = search.result()['result'][0]
	video_id = top_result['id']
	video_title = top_result['title']
	video_url = f"https://www.youtube.com/watch?v={video_id}"
	return f"Title: {video_title}\nURL: {video_url}"
	except IndexError:
	return "Error: No YouTube videos found for that query."
	except Exception as e:
	return f"An unknown error occurred during Youtube: {e}"

	@tool
	def get_youtube_transcript(video_url: str) -> str:
	"""
	Extracts and returns the full transcript of a YouTube video.

	Args:
	video_url (str): The full URL of the YouTube video.

	Returns:
	str: The transcript text, or an error message if unavailable.
	"""
	print(f"--- Executing YouTube Transcript Tool for URL: '{video_url}' ---")
	try:
	# Extract video ID from URL
	if "watch?v=" in video_url:
	video_id = video_url.split("watch?v=")[1].split("&")[0]
	elif "youtu.be/" in video_url:
	video_id = video_url.split("youtu.be/")[1].split("?")[0]
	else:
	return "Error: Invalid YouTube URL format."

	# Fetch the transcript
	transcript_list = YouTubeTranscriptApi.get_transcript(video_id)

	# Combine transcript segments into a single block of text
	full_transcript = " ".join([item['text'] for item in transcript_list])

	return full_transcript
	except NoTranscriptFound:
	return "Error: No transcript could be found for this video."
	except TranscriptsDisabled:
	return "Error: Transcripts are disabled for this video."
	except Exception as e:
	return f"An unknown error occurred while fetching the transcript: {e}"

	@tool
	def get_wikipedia_summary(query: str) -> str:
	"""
	Fetches and returns the summary of a Wikipedia article.

	Args:
	query (str): The title or topic of the Wikipedia article to search.

	Returns:
	str: The summary text of the article, or an error message if not found.
	"""
	print(f"--- Executing Wikipedia Tool with query: '{query}' ---")
	page = wiki_api.page(query)
	if not page.exists():
	return f"Error: The Wikipedia page for '{query}' could not be found."
	return f"Title: {page.title}\n\nSummary:\n{page.summary}"

	@tool
	def analyze_excel_file(file_path: str, query: str) -> str:
	"""
	Analyze an Excel file using pandas and answer a question about it.
	Args:
	file_path (str): the path to the Excel file.
	query (str): Question about the data
	"""
	try:
	# Read the Excel file
	df = pd.read_excel(file_path)

	# Run various analyses based on the query
	result = (
	f"Excel file loaded with {len(df)} rows and {len(df.columns)} columns.\n"
	)
	result += f"Columns: {', '.join(df.columns)}\n\n"

	# Add summary statistics
	result += "Summary statistics:\n"
	result += str(df.describe())

	return result

	except Exception as e:
	return f"Error analyzing Excel file: {str(e)}"

	class BasicAgent:
	def __init__(self):


	model = LiteLLMModel(model_id="gpt-4.1-2025-04-14")


	self.agent = CodeAgent(
	model=model,
	tools=[DuckDuckGoSearchTool(),
	PythonInterpreterTool(),
	FinalAnswerTool(),
	VisitWebpageTool(),
	search_youtube_video,
	get_youtube_transcript,
	get_wikipedia_summary,
	analyze_excel_file],
	additional_authorized_imports=['numpy','csv','xlrd','openpyxl','pandas','markdownify','requests'],
	add_base_tools=False,
	max_steps=10,
	)




	def __call__(self, question: str) -> str:

	custom_prompt = ("""
	__CONSTRAINTS__
	- DO NOT start with an intro or include an outro.
	""")

	print(f"Agent received question (first 50 chars): {question[:50]}...")
	result = self.agent.run(custom_prompt + question)

	print("Raw result:", result)

	if isinstance(result, dict) and "output" in result:
	final_str = str(result["output"]).strip()
	elif hasattr(result, "output"):
	final_str = str(result.output).strip()
	else:
	final_str = str(result).strip()

	return final_str