Final_Assignment_Template

Running

Markiian Tsalyk

upd

36a7313 2 months ago

9.72 kB

	from smolagents import DuckDuckGoSearchTool, GoogleSearchTool
	from youtube_transcript_api import YouTubeTranscriptApi
	from supadata import Supadata, SupadataError
	import wikipedia
	from wikipedia_tables_parser import fetch_wikipedia_tables
	import pandas as pd
	from typing import Any
	import os
	from dotenv import load_dotenv

	load_dotenv()
	import importlib.util
	import sys
	import io
	import contextlib
	from llama_index.llms.openrouter import OpenRouter
	from llama_index.core.types import ChatMessage


	llm = OpenRouter(
	api_key=os.getenv("OPENROUTER_API_KEY"),
	model="google/gemini-2.5-flash-preview",
	temperature=0.7,
	)
	supadata = Supadata(api_key=os.getenv("SUPADATA_API_KEY"))


	def reverse_text(text: str, **kwargs) -> str:
	"""
	Returns the reversed version of the text.
	If you receive some unknown text, that can't be recognized and analyzed, then you need to use this tool to make it clear.

	Args:
	text: text to be reversed

	Return:
	The reversed text.
	"""
	try:
	print(text[::-1])
	return text[::-1]
	except Exception as e:
	raise ValueError(f"Can't reverse text: {e}")


	def fetch_historical_event_data(event_name: str, year: str, **kwargs) -> str:
	"""
	Fetches data about historical event that occured in certain year.
	Some examples of events: Olympics games, Footbal games, NBA etc.

	Args:
	event_name: String name of the event
	year: String year of the event

	Return:
	String with data about the event
	"""
	result = wikipedia.page(f"{event_name} in {year}")

	url = result.url
	content = result.content
	try:
	tables = pd.read_html(url)
	except Exception as e:
	tables = fetch_wikipedia_tables(url)

	result = f"Content: {content}\nTables: {tables}"

	return result


	def classify_fruit_vegitable(item: str, **kwargs) -> str:
	"""
	Classifies items to fruits and vegitables

	Args:
	item: Item to classify

	Returns:
	Text with explanation whether it is a fruit or vegetable.
	"""
	response = llm.chat(
	messages=[
	ChatMessage(
	content=f"Classify whether it is fruit or vegetable: {item}. Return only `fruit` or `vegetable` without explanations"
	)
	]
	)
	return response.message.content


	def web_search(query: str, **kwargs) -> str:
	"""
	Returns web search results for the provided query.
	Don't use it for Wikipedia queries. For Wikipedia queries use wikipedia_search tool.
	Important, query is human-language string input, not the URL or key.

	Args:
	query: query to search in WEB

	Return:
	String with web search results.
	"""
	result = DuckDuckGoSearchTool().forward(query)
	# result = GoogleSearchTool(provider="serpapi").forward(query)
	print(result)
	return result


	def wikipedia_search(query: str, **kwargs) -> Any:
	"""
	Returns wikipedia search results for the provided query.

	Args:
	query: query to search in WIKIPEDIA

	Return:
	Wikipedia search results.
	"""
	result = wikipedia.page(query)

	url = result.url
	content = result.content
	try:
	tables = pd.read_html(url)
	except:
	tables = fetch_wikipedia_tables(url)

	result = f"Content: {content}\nTables: {tables}"

	return result


	def multiply(a: float, b: float, **kwargs) -> float:
	"""
	Multiply two numbers.

	Args:
	a: First number
	b: Second number

	Return:
	The product of the two numbers.
	"""
	return a * b


	def compute_sum(values: list[int \| float], **kwargs) -> float:
	"""
	Computes sum of provided values

	Args:
	values: list of integer or float values
	Return:
	Sum of the values
	"""
	return sum(values)


	def length(iterable: Any, **kwargs) -> int:
	"""
	Return the length of an iterable.

	Args:
	iterable: Any iterable

	Return:
	The length of the iterable.
	"""
	return len(iterable)


	def execute_python_file(file_path: str) -> Any:
	"""
	Executes a Python file and returns its result.

	This function takes a path to a Python file, executes it by importing it as a module,
	and returns the result. The file should contain a function call that produces
	the result to be returned. This version also executes code under the
	'if __name__ == "__main__":' block.

	Args:
	file_path (str): Path to the Python file to execute.

	Returns:
	Any: The result of executing the Python file. If the file sets a variable
	named 'result', that value will be returned.

	Raises:
	FileNotFoundError: If the specified file does not exist.
	ImportError: If there was an error importing the Python file.

	Example:
	>>> # If example.py contains: result = 2 + 3
	>>> execute_python_file('example.py')
	5
	"""
	# Verify file exists
	if not os.path.isfile(file_path):
	raise FileNotFoundError(f"File not found: {file_path}")

	# Get the directory and filename
	file_dir = os.path.dirname(os.path.abspath(file_path))
	file_name = os.path.basename(file_path)
	module_name = file_name.replace(".py", "")

	# Store original sys.path and add the file's directory
	original_sys_path = sys.path.copy()
	sys.path.insert(0, file_dir)

	# Prepare stdout/stderr capture
	stdout_capture = io.StringIO()
	stderr_capture = io.StringIO()

	# First approach: Import normally to get module definitions
	try:
	spec = importlib.util.spec_from_file_location(module_name, file_path)
	if spec is None or spec.loader is None:
	raise ImportError(f"Could not load module spec from {file_path}")

	module = importlib.util.module_from_spec(spec)
	sys.modules[module_name] = module

	# Execute the module
	with contextlib.redirect_stdout(stdout_capture), contextlib.redirect_stderr(
	stderr_capture
	):
	spec.loader.exec_module(module)

	# After module is loaded, directly execute the main block by reading the file
	# and executing the content with __name__ = "__main__"
	with open(file_path, "r") as f:
	file_content = f.read()
	# Create a namespace with everything from the module
	namespace = {**module.__dict__}
	namespace["__name__"] = "__main__"
	exec(file_content, namespace)

	if hasattr(module, "result"):
	return module.result
	else:
	output = stdout_capture.getvalue().strip()
	print(f"RESULT PYTHON: {output}")
	return output

	except Exception as e:
	error_output = stderr_capture.getvalue()
	if error_output:
	raise type(e)(f"{str(e)}\nProgram output: {error_output}") from None
	else:
	raise
	finally:
	sys.path = original_sys_path

	if module_name in sys.modules:
	del sys.modules[module_name]


	def trascript_youtube(video_id: str, **kwargs) -> str:
	"""
	Returns transcript of YouTube video.

	Args:
	video_id: ID of youtube video (Pass in the video ID, NOT the video URL. For a video with the URL https://www.youtube.com/watch?v=12345 the ID is 12345.)

	Return:
	Transcript of YouTube video.
	"""
	transcript = supadata.youtube.transcript(video_id=video_id, lang="en")

	return transcript.content


	def read_excel(path: str, **kwargs) -> pd.DataFrame:
	"""
	Reads xlsx file

	Args:
	path: path to xlsx file

	Return:
	Pandas dataframe
	"""
	return pd.read_excel(path)


	def pandas_column_sum(
	pandas_column_values: list[int \| float], column_name: str, **kwargs
	) -> float:
	"""
	Computes sum on pandas dataframe column

	Args:
	pandas_column_values: List with float or integer pandas values
	column_name: Name of the column

	Return:
	Sum of the column
	"""
	return sum(pandas_column_values)


	def final_answer(answer: str, **kwargs) -> str:
	"""
	Prepare the final answer for the user. It should be always used as a last step.

	Args:
	answer: The answer to format and return to the user
	Return:
	The final answer.
	"""
	resp = llm.chat(
	messages=[
	ChatMessage(
	content=f"""
	Final answer from agent: {answer}
	Make final answer as short as possible.
	Final answer should be a number or as few words as possible or a comma separated list of numbers and/or strings. If you are asked for a number, don't use comma to write your number neither use units such as $ or percent sign unless specified otherwise. If you are asked for a string, don't use articles, neither abbreviations (e.g. for cities), and write the digits in plain text unless specified otherwise. If you are asked for a comma separated list, apply the above rules depending of whether the element to be put in the list is a number or a string.
	There might be requested exact number, then you need to compress the output so that it was only number without any comments or explanations (float or integer).
	And on the other hand, the question might request some exact string value. Don't explain it, just return this value (For example, insted of `In response to the question, desired person is X` return only `X`)
	Again, you don't need to modify or solve answer, you just need to format it properly.
	"""
	)
	]
	)
	return resp.message.content


	# print(wikipedia_search("Mercedes Sosa studio albums"))
	# execute_python_file("f918266a-b3e0-4914-865d-4faa564f1aef.py")