Final_Assignment_Template3

Sleeping

App Files Files Community

Final_Assignment_Template3 / myagent.py

bwilkie

Update myagent.py

a94813f verified about 2 months ago

raw

history blame

3.6 kB

	import os
	from smolagents import CodeAgent, ToolCallingAgent
	from smolagents import OpenAIServerModel
	from tools.fetch import fetch_webpage
	from tools.yttranscript import get_youtube_transcript, get_youtube_title_description
	import myprompts
	from transformers import AutoTokenizer, AutoModelForCausalLM, pipeline

	import torch
	# --- Basic Agent Definition ---
	class BasicAgent:
	    """Answer a question by routing it to the code agent or the model agent.

	    A reviewer agent is asked first which route fits the question. Its reply
	    is normalized and compared against the two labels this class recognizes
	    ("code" and "model"). The module-level ``reviewer_agent``, ``gaia_agent``
	    and ``model_agent`` objects and the ``myprompts`` module supply the
	    agents and prompt text.
	    """

	    # Labels recognized in the reviewer agent's reply.
	    _ROUTE_CODE = "code"
	    _ROUTE_MODEL = "model"

	    def __init__(self):
	        print("BasicAgent initialized.")

	    @staticmethod
	    def _normalize_route(reviewer_answer) -> str:
	        """Reduce the reviewer's raw reply to a bare lowercase label.

	        Language-model output often carries stray whitespace, quotes, a
	        trailing period or different casing; an exact ``==`` comparison
	        against the raw reply would then match neither route.
	        """
	        return str(reviewer_answer).strip(" \t\r\n\"'`.").lower()

	    def __call__(self, question: str) -> str:
	        """Run the reviewer, dispatch to the chosen agent and return its answer.

	        Args:
	            question: The question text to answer.

	        Returns:
	            Whatever the selected agent's ``run`` call returns, or an error
	            message string if any step raised.
	        """
	        print(f"Agent received question (first 50 chars): {question[:50]}...")

	        try:
	            # Use the reviewer agent to determine if the question can be
	            # answered by a model or requires code.
	            print("Calling reviewer agent...")
	            reviewer_answer = reviewer_agent.run(
	                myprompts.review_prompt + "\nThe question is:\n" + question
	            )
	            print(f"Reviewer agent answer: {reviewer_answer}")

	            route = self._normalize_route(reviewer_answer)
	            question = question + '\n' + myprompts.output_format

	            if route == self._ROUTE_MODEL:
	                print("Using model agent to answer the question.")
	                fixed_answer = model_agent.run(
	                    myprompts.model_prompt + "\nThe question is:\n" + question
	                )
	                print(f"Model agent answer: {fixed_answer}")
	                return fixed_answer

	            if route != self._ROUTE_CODE:
	                # An unrecognized label used to yield an empty answer with no
	                # trace; use the code agent (it has the larger tool set)
	                # and say so in the log instead.
	                print(
	                    f"Unrecognized reviewer answer {reviewer_answer!r}; "
	                    "falling back to code agent."
	                )

	            fixed_answer = gaia_agent.run(question)
	            print(f"Code agent answer: {fixed_answer}")
	            return fixed_answer
	        except Exception as e:
	            # Deliberately broad: this is the outermost boundary, and the
	            # caller receives the error text as the answer instead of a crash.
	            error = f"An error occurred while processing the question: {e}"
	            print(error)
	            return error




	# Wrapper that gives a local causal LM a simple prompt-in / text-out interface.
	class LocalLlamaModel:
	    """Text-in/text-out wrapper around a causal language model and its tokenizer.

	    ``tokenizer`` is called as ``tokenizer(prompt, return_tensors="pt")`` and
	    must also provide ``eos_token_id`` and ``decode``; ``model`` must provide
	    ``generate``. Instances are callable, which delegates to ``generate``.

	    NOTE(review): the agents in this file are handed this object as their
	    ``model``. Whether they accept a plain ``str`` prompt and a ``str`` return
	    value (rather than chat messages and a message object) cannot be
	    confirmed from this file — verify against the installed smolagents version.
	    """

	    # Sampling settings used unless the caller passes its own values.
	    _DEFAULT_GENERATION_KWARGS = {"do_sample": True, "temperature": 0.7}

	    def __init__(self, model, tokenizer):
	        self.model = model
	        self.tokenizer = tokenizer
	        # Fall back to CPU for model objects that do not expose a device.
	        self.device = getattr(model, "device", "cpu")

	    def generate(self, prompt: str, max_new_tokens=512, **kwargs):
	        """Generate a continuation of ``prompt`` with the local model.

	        Args:
	            prompt: Text to tokenize and feed to the model.
	            max_new_tokens: Upper bound on the number of generated tokens.
	            **kwargs: Extra options forwarded to ``model.generate``. They
	                take precedence over this wrapper's defaults, so passing
	                e.g. ``temperature`` or ``do_sample`` overrides the default
	                instead of raising a duplicate-keyword ``TypeError``.

	        Returns:
	            The decoded newly generated tokens, without the prompt and with
	            special tokens skipped.
	        """
	        encoded = self.tokenizer(prompt, return_tensors="pt")
	        input_ids = encoded.input_ids.to(self.device)

	        options = dict(self._DEFAULT_GENERATION_KWARGS)
	        options["max_new_tokens"] = max_new_tokens
	        options["pad_token_id"] = self.tokenizer.eos_token_id

	        # With pad == eos the model cannot infer the mask from the ids, so
	        # forward the tokenizer's own mask whenever it provides one.
	        attention_mask = getattr(encoded, "attention_mask", None)
	        if attention_mask is not None:
	            options["attention_mask"] = attention_mask.to(self.device)

	        # Caller-supplied options win over every default set above.
	        options.update(kwargs)

	        with torch.no_grad():
	            output_ids = self.model.generate(input_ids, **options)

	        # Decode only the new tokens (excluding the input)
	        prompt_length = input_ids.shape[1]
	        new_tokens = output_ids[0][prompt_length:]
	        return self.tokenizer.decode(new_tokens, skip_special_tokens=True)

	    def __call__(self, prompt: str, max_new_tokens=512, **kwargs):
	        """Make the model callable like a function; same contract as ``generate``."""
	        return self.generate(prompt, max_new_tokens, **kwargs)

	# Load the checkpoint that backs every agent below. `model_init` and
	# `tokenizer` are not defined anywhere else in this module, so they are
	# created here from the checkpoint named by the LOCAL_MODEL_ID environment
	# variable.
	# NOTE(review): the intended checkpoint is not recorded in this file, so no
	# default is assumed — confirm the model id and set it in the environment.
	_model_id = os.environ.get("LOCAL_MODEL_ID")
	if not _model_id:
	    raise RuntimeError(
	        "LOCAL_MODEL_ID is not set; it must name the Hugging Face checkpoint "
	        "to load for the local model."
	    )
	tokenizer = AutoTokenizer.from_pretrained(_model_id)
	model_init = AutoModelForCausalLM.from_pretrained(_model_id)

	# Create the model instance
	model = LocalLlamaModel(model_init, tokenizer)

	# Now create the agents; all three share the same wrapped model.
	reviewer_agent = ToolCallingAgent(model=model, tools=[])
	model_agent = ToolCallingAgent(model=model, tools=[fetch_webpage])
	gaia_agent = CodeAgent(
	    tools=[fetch_webpage, get_youtube_title_description, get_youtube_transcript],
	    model=model,
	)

	if __name__ == "__main__":
	    # Manual smoke test: push one sample question through the agent and
	    # print whatever comes back.
	    sample_question = "What was the actual enrollment of the Malko competition in 2023?"
	    demo_agent = BasicAgent()
	    print(f"Answer: {demo_agent(sample_question)}")