GAIA Agent Deployment
Deploy Complete Enhanced GAIA Agent with Phase 1-6 Improvements
9a6a4dc
"""Enhanced GAIA Agent - Complete Phase 1-6 Deployment"""
import os
import gradio as gr
import requests
import pandas as pd
import sys
import traceback
from pathlib import Path
from typing import Optional, List, Union
# Load environment variables from .env file if it exists
def load_env_file():
"""Load environment variables from .env file if it exists."""
env_file = Path('.env')
if env_file.exists():
with open(env_file, 'r') as f:
for line in f:
line = line.strip()
if line and not line.startswith('#') and '=' in line:
key, value = line.split('=', 1)
os.environ[key.strip()] = value.strip()
# Load environment variables at startup
load_env_file()
# Environment setup for HuggingFace Space deployment
def setup_environment():
"""Setup environment variables for HuggingFace Space deployment."""
print("Setting up environment for HuggingFace Space...")
# Check if we're running in HuggingFace Space
space_host = os.getenv("SPACE_HOST")
space_id = os.getenv("SPACE_ID")
if space_host or space_id:
print(f"βœ… Running in HuggingFace Space: {space_id}")
print(f"βœ… Space host: {space_host}")
else:
print("ℹ️ Running locally or environment variables not set")
# Verify API keys are available (they should be in HF Spaces secrets)
required_keys = ["MISTRAL_API_KEY", "EXA_API_KEY", "FIRECRAWL_API_KEY"]
missing_keys = []
for key in required_keys:
if os.getenv(key):
print(f"βœ… {key} found in environment")
else:
print(f"⚠️ {key} not found in environment")
missing_keys.append(key)
if missing_keys:
print(f"⚠️ Missing API keys: {missing_keys}")
print("ℹ️ These should be set as HuggingFace Spaces secrets")
return len(missing_keys) == 0
# Initialize environment
ENV_READY = setup_environment()
# Import Complete Enhanced GAIA Agent
try:
from agents.complete_enhanced_gaia_agent import enhanced_gaia_agent
ENHANCED_AGENT_AVAILABLE = True
print("βœ… Successfully imported Complete Enhanced GAIA Agent (Phase 1-6)")
print(f"πŸ“Š Agent status: {enhanced_gaia_agent.get_status()}")
except Exception as e:
print(f"❌ Could not import Complete Enhanced GAIA Agent: {e}")
print("Traceback:", traceback.format_exc())
ENHANCED_AGENT_AVAILABLE = False
# Fallback to original agent if enhanced version fails
if not ENHANCED_AGENT_AVAILABLE:
try:
from agents.enhanced_unified_agno_agent import GAIAAgent
FALLBACK_AGNO_AVAILABLE = True
print("βœ… Fallback: Successfully imported Enhanced Unified AGNO Agent")
except Exception as e:
print(f"❌ Could not import fallback agent: {e}")
FALLBACK_AGNO_AVAILABLE = False
else:
FALLBACK_AGNO_AVAILABLE = False
# Constants
DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space"
class DeploymentReadyGAIAAgent:
"""Complete Enhanced GAIA Agent with Phase 1-6 capabilities."""
def __init__(self):
print("DeploymentReadyGAIAAgent initializing...")
# Try enhanced agent first
if ENHANCED_AGENT_AVAILABLE and ENV_READY:
try:
self.agent = enhanced_gaia_agent
print("πŸš€ Using Complete Enhanced GAIA Agent with Phase 1-6 improvements")
print(f"πŸ“Š Total tools available: {self.agent.get_status()['total_tools']}")
self.agent_type = "complete_enhanced"
except Exception as e:
print(f"❌ Complete Enhanced GAIA Agent initialization failed: {e}")
print("πŸ”„ Falling back to original agent...")
# Fall back to original agent
if FALLBACK_AGNO_AVAILABLE:
try:
self.agent = GAIAAgent()
print("πŸš€ Using Enhanced Unified AGNO Agent (fallback)")
self.agent_type = "fallback_agno"
except Exception as e2:
print(f"❌ Fallback agent initialization also failed: {e2}")
raise RuntimeError(f"Both agents failed: Enhanced={e}, Fallback={e2}")
else:
raise RuntimeError(f"Enhanced agent failed and fallback not available: {e}")
elif FALLBACK_AGNO_AVAILABLE and ENV_READY:
try:
self.agent = GAIAAgent()
print("πŸš€ Using Enhanced Unified AGNO Agent (fallback)")
self.agent_type = "fallback_agno"
except Exception as e:
print(f"❌ Fallback agent initialization failed: {e}")
raise RuntimeError(f"Fallback agent required but failed to initialize: {e}")
else:
missing_reqs = []
if not ENHANCED_AGENT_AVAILABLE and not FALLBACK_AGNO_AVAILABLE:
missing_reqs.append("No agent available (both enhanced and fallback import failed)")
if not ENV_READY:
missing_reqs.append("Environment not ready (check API keys)")
error_msg = f"Agent not available: {', '.join(missing_reqs)}"
print(f"❌ {error_msg}")
print("πŸ’‘ Required: MISTRAL_API_KEY, EXA_API_KEY, FIRECRAWL_API_KEY")
raise RuntimeError(error_msg)
def __call__(self, question: str, files: Optional[List[Union[str, dict]]] = None) -> str:
print(f"Agent ({self.agent_type}) received question: {question[:100]}...")
if files:
print(f"Agent received {len(files)} files: {files}")
try:
# Pass files to the underlying agent if it supports them
if hasattr(self.agent, '__call__') and 'files' in self.agent.__call__.__code__.co_varnames:
answer = self.agent(question, files)
else:
# Fallback for agents that don't support files parameter
answer = self.agent(question)
print(f"Agent response: {answer}")
return answer
except Exception as e:
print(f"Error in DeploymentReadyGAIAAgent: {e}")
traceback.print_exc()
return "unknown"
def run_and_submit_all(profile: gr.OAuthProfile | None):
"""Fetch questions, run agent, submit answers, and display results."""
# Determine HF Space Runtime URL and Repo URL
space_id = os.getenv("SPACE_ID", "JoachimVC/gaia-enhanced-agent")
if profile:
username = f"{profile.username}"
print(f"User logged in: {username}")
else:
print("User not logged in.")
return "Please Login to Hugging Face with the button.", None
# Determine agent_code URL
agent_code = f"https://huggingface.co/spaces/{space_id}/tree/main"
print(f"Agent code URL: {agent_code}")
# API URLs
api_base = DEFAULT_API_URL
questions_url = f"{api_base}/questions"
submit_url = f"{api_base}/submit"
try:
# 1. Fetch Questions
print("Fetching questions...")
response = requests.get(questions_url, timeout=30)
response.raise_for_status()
questions_data = response.json()
print(f"Fetched {len(questions_data)} questions.")
# 2. Initialize Agent
agent = DeploymentReadyGAIAAgent()
# 3. Process Questions
results_log = []
answers_payload = []
print(f"Running enhanced agent on {len(questions_data)} questions...")
for i, question_data in enumerate(questions_data):
task_id = question_data.get("task_id", f"task_{i}")
question_text = question_data.get("question", "")
file_name = question_data.get("file_name", "")
print(f"Processing question {i+1}/{len(questions_data)}: {task_id}")
if file_name:
print(f"πŸ“Ž Question has attached file: {file_name}")
try:
# Prepare files list if file is attached
files = None
if file_name and file_name.strip():
files = [file_name.strip()]
print(f"πŸ“ Passing file to agent: {files}")
# Call agent with files if available
if files:
submitted_answer = agent(question_text, files)
else:
submitted_answer = agent(question_text)
answers_payload.append({"task_id": task_id, "submitted_answer": submitted_answer})
results_log.append({"Task ID": task_id, "Question": question_text, "Submitted Answer": submitted_answer})
except Exception as e:
print(f"Error processing question {task_id}: {e}")
traceback.print_exc()
error_answer = "unknown"
answers_payload.append({"task_id": task_id, "submitted_answer": error_answer})
results_log.append({"Task ID": task_id, "Question": question_text, "Submitted Answer": error_answer})
if not answers_payload:
print("Agent did not produce any answers to submit.")
return "No answers to submit.", pd.DataFrame()
# 4. Prepare Submission
submission_data = {"username": username.strip(), "agent_code": agent_code, "answers": answers_payload}
status_update = f"Enhanced agent finished. Submitting {len(answers_payload)} answers for user '{username}'..."
print(status_update)
# 5. Submit
print(f"Submitting {len(answers_payload)} answers to: {submit_url}")
response = requests.post(submit_url, json=submission_data, timeout=30)
# Enhanced error handling for 422 errors
if response.status_code == 422:
print(f"422 Unprocessable Entity Error Details:")
print(f"Response text: {response.text}")
try:
error_details = response.json()
print(f"Error JSON: {error_details}")
except:
print("Could not parse error response as JSON")
response.raise_for_status()
final_status = response.text
print(f"Submission successful: {final_status}")
results_df = pd.DataFrame(results_log)
return final_status, results_df
except requests.exceptions.HTTPError as e:
error_detail = f"Server responded with status {e.response.status_code}."
try:
error_json = e.response.json()
error_detail += f" Detail: {error_json.get('detail', e.response.text)}"
except requests.exceptions.JSONDecodeError:
error_detail += f" Response: {e.response.text[:500]}"
status_message = f"Submission Failed: {error_detail}"
print(status_message)
results_df = pd.DataFrame(results_log) if 'results_log' in locals() else pd.DataFrame()
return status_message, results_df
except Exception as e:
status_message = f"An unexpected error occurred: {e}"
print(status_message)
traceback.print_exc()
results_df = pd.DataFrame(results_log) if 'results_log' in locals() else pd.DataFrame()
return status_message, results_df
# Gradio Interface
with gr.Blocks() as demo:
gr.Markdown("# Complete Enhanced GAIA Agent - Phase 1-6 Deployment")
gr.Markdown(
"""
**πŸš€ Complete Enhanced GAIA Agent with All Phase 1-6 Improvements**
**Instructions:**
1. Log in to your Hugging Face account using the button below.
2. Click 'Run Evaluation & Submit All Answers' to test the complete enhanced system.
**✨ Phase 1-6 Enhanced Capabilities:**
**Phase 1 - Web Research Enhancement:**
- βœ… Advanced web search with Exa API integration
- βœ… Specialized Wikipedia research tools
- βœ… Multi-source research orchestration
- βœ… AGNO-compatible research wrappers
**Phase 2 - Audio Processing Implementation:**
- βœ… Audio transcription with Faster-Whisper (European open-source)
- βœ… Recipe and educational content analysis
- βœ… Multi-format audio support
**Phase 3 - Mathematical Code Execution:**
- βœ… Advanced mathematical engine with SymPy
- βœ… Secure Python code execution
- βœ… AST parsing and code analysis
- βœ… AGNO-compatible math tools
**Phase 4 - Excel Data Analysis Enhancement:**
- βœ… Advanced Excel file processing
- βœ… Financial calculations and analysis
- βœ… Excel formula evaluation
**Phase 5 - Advanced Video Analysis Enhancement:**
- βœ… Object detection and counting
- βœ… Computer vision engine
- βœ… Scene analysis and description
**Phase 6 - Complex Text Processing Enhancement:**
- βœ… RTL (Right-to-Left) text processing
- βœ… Multi-orientation OCR
- βœ… Advanced linguistic pattern recognition
**🎯 Expected Performance:**
- **Baseline:** 6/20 questions (30%)
- **Enhanced Target:** 16-18/20 questions (80-90%)
- **Improvement Factor:** 2.5-3x performance increase
**πŸ”§ Technical Features:**
- βœ… 28+ tools with graceful degradation
- βœ… European open-source compliance
- βœ… Zero temperature for consistent results
- βœ… Comprehensive error handling
- βœ… AGNO native orchestration
"""
)
gr.LoginButton()
run_button = gr.Button("Run Evaluation & Submit All Answers")
status_output = gr.Textbox(label="Run Status / Submission Result", lines=5, interactive=False)
results_table = gr.DataFrame(label="Questions and Agent Answers", wrap=True)
run_button.click(
fn=run_and_submit_all,
outputs=[status_output, results_table]
)
if __name__ == "__main__":
print("\n" + "-"*30 + " Enhanced GAIA Agent Starting " + "-"*30)
space_host_startup = os.getenv("SPACE_HOST")
space_id_startup = os.getenv("SPACE_ID")
if space_host_startup:
print(f"βœ… SPACE_HOST found: {space_host_startup}")
print(f" Runtime URL should be: https://{space_host_startup}.hf.space")
else:
print("ℹ️ SPACE_HOST environment variable not found (running locally?).")
if space_id_startup:
print(f"βœ… SPACE_ID found: {space_id_startup}")
else:
print("ℹ️ SPACE_ID environment variable not found, using default.")
print("-"*70)
demo.launch()