Spaces:

JoachimVC
/

gaia-enhanced-agent

Running

gaia-enhanced-agent / agents /fixed_enhanced_unified_agno_agent.py

GAIA Agent Deployment

Deploy Complete Enhanced GAIA Agent with Phase 1-6 Improvements

9a6a4dc 9 days ago

32.2 kB

	"""
	Fixed GAIA Agent - Addresses Core Evaluation Issues
	Fixes the 5/20 score by addressing:
	1. Answer format enforcement
	2. Tool integration reliability
	3. Response extraction simplification
	4. Proper instruction alignment
	"""

	import os
	import logging
	from typing import Dict, Any, List, Optional, Union
	from pathlib import Path

	from agno.agent import Agent
	from agno.models.mistral import MistralChat

	# Import enhanced response processor
	from utils.response_processor import EnhancedResponseProcessor

	# Import calculator prompt enhancer
	from utils.calculator_prompt_enhancer import CalculatorPromptEnhancer

	# Import enhanced file handler
	from utils.file_handler import (
	EnhancedFileHandler,
	FileType,
	FileFormat,
	ProcessedFile,
	FileInfo,
	process_file,
	validate_file_exists,
	cleanup_temp_files
	)

	# Remove redundant tool selection - Agno handles this naturally

	# Import multimodal tools with enhanced RTL support
	try:
	from .enhanced_rtl_multimodal_agent import EnhancedRTLMultimodalTools
	MULTIMODAL_AVAILABLE = True
	ENHANCED_RTL_AVAILABLE = True
	except ImportError:
	try:
	from enhanced_rtl_multimodal_agent import EnhancedRTLMultimodalTools
	MULTIMODAL_AVAILABLE = True
	ENHANCED_RTL_AVAILABLE = True
	except ImportError:
	# Fallback to standard multimodal tools
	try:
	from .mistral_multimodal_agent import OpenSourceMultimodalTools as EnhancedRTLMultimodalTools
	MULTIMODAL_AVAILABLE = True
	ENHANCED_RTL_AVAILABLE = False
	except ImportError:
	try:
	from mistral_multimodal_agent import OpenSourceMultimodalTools as EnhancedRTLMultimodalTools
	MULTIMODAL_AVAILABLE = True
	ENHANCED_RTL_AVAILABLE = False
	except ImportError:
	EnhancedRTLMultimodalTools = None
	MULTIMODAL_AVAILABLE = False
	ENHANCED_RTL_AVAILABLE = False

	# Load environment variables from .env file
	def load_env_file():
	"""Load environment variables from .env file if it exists."""
	env_file = Path('.env')
	if env_file.exists():
	with open(env_file, 'r') as f:
	for line in f:
	line = line.strip()
	if line and not line.startswith('#') and '=' in line:
	key, value = line.split('=', 1)
	os.environ[key.strip()] = value.strip()

	# Load environment variables at module level
	load_env_file()

	logger = logging.getLogger(__name__)


	class FixedGAIAAgent:
	"""
	Enhanced GAIA Agent with sophisticated response processing.

	Key features:
	1. Enforces "FINAL ANSWER:" format in instructions
	2. Uses enhanced response processor with multi-stage extraction
	3. Simplified tool initialization with better error handling
	4. Advanced response processing with confidence scoring
	5. Semantic analysis and question type classification
	"""

	def __init__(self):
	"""Initialize the fixed GAIA agent."""
	logger.info("🚀 Initializing Fixed GAIA Agent...")

	# Initialize enhanced file handler
	self.file_handler = EnhancedFileHandler()
	logger.info("🗂️ Enhanced file handler initialized")

	# Initialize enhanced response processor
	self.response_processor = EnhancedResponseProcessor()
	logger.info("🧠 Enhanced response processor initialized")

	# Initialize calculator prompt enhancer
	self.prompt_enhancer = CalculatorPromptEnhancer()
	logger.info("🔧 Calculator prompt enhancer initialized")

	# Agno framework handles tool selection naturally - no need for separate selector
	logger.info("🎯 Using Agno's built-in intelligent tool orchestration")

	# Initialize tools with better error handling
	self.tools = self._init_tools_with_validation()

	# Initialize multimodal tools
	self.multimodal_tools = self._init_multimodal_tools()
	if self.multimodal_tools:
	self.tools.extend(self.multimodal_tools.tools)

	# Check for required API key
	self.mistral_api_key = os.getenv("MISTRAL_API_KEY")
	if not self.mistral_api_key:
	logger.error("❌ MISTRAL_API_KEY not found - agent requires this for operation")
	self.agent = None
	self.available = False
	return

	# Create the agent with fixed instructions
	self.agent = self._create_fixed_agent()

	# Set availability flag
	self.available = self.agent is not None

	if self.available:
	logger.info("✅ Fixed GAIA Agent initialized successfully")
	logger.info(f"📊 Available tools: {len(self.tools)}")
	logger.info(f"🗂️ File handler capabilities: {list(self.file_handler.get_supported_formats().keys())}")
	else:
	logger.error("❌ Fixed GAIA Agent initialization failed")

	def _init_tools_with_validation(self) -> List[Any]:
	"""Initialize tools with better validation and error handling."""
	tools = []
	tool_status = {}

	# Core tools that should always work
	core_tools = [
	{
	'name': 'calculator',
	'module': 'agno.tools.calculator',
	'class': 'CalculatorTools',
	'required_env': None,
	'critical': True
	},
	{
	'name': 'python',
	'module': 'agno.tools.python',
	'class': 'PythonTools',
	'required_env': None,
	'critical': True
	},
	]

	# Optional tools - only EXA and Firecrawl need API keys
	optional_tools = [
	{
	'name': 'wikipedia',
	'module': 'agno.tools.wikipedia',
	'class': 'WikipediaTools',
	'required_env': None,
	'critical': False
	},
	{
	'name': 'arxiv',
	'module': 'agno.tools.arxiv',
	'class': 'ArxivTools',
	'required_env': None,
	'critical': False
	},
	{
	'name': 'file',
	'module': 'agno.tools.file',
	'class': 'FileTools',
	'required_env': None,
	'critical': False
	},
	{
	'name': 'shell',
	'module': 'agno.tools.shell',
	'class': 'ShellTools',
	'required_env': None,
	'critical': False
	},
	{
	'name': 'firecrawl',
	'module': 'agno.tools.firecrawl',
	'class': 'FirecrawlTools',
	'required_env': 'FIRECRAWL_API_KEY',
	'critical': False
	},
	{
	'name': 'exa',
	'module': 'agno.tools.exa',
	'class': 'ExaTools',
	'required_env': 'EXA_API_KEY',
	'critical': False
	},
	{
	'name': 'youtube',
	'module': 'agno.tools.youtube',
	'class': 'YouTubeTools',
	'required_env': None,
	'critical': False
	},
	{
	'name': 'video_analysis',
	'module': 'tools.video_analysis_tool',
	'class': 'VideoAnalysisTool',
	'required_env': None,
	'description': 'Video frame extraction and visual analysis for YouTube videos',
	'critical': False
	},
	]

	all_tools = core_tools + optional_tools

	for tool_config in all_tools:
	tool_name = tool_config['name']
	module_path = tool_config['module']
	class_name = tool_config['class']
	required_env = tool_config['required_env']
	is_critical = tool_config['critical']

	try:
	# Check environment requirements
	if required_env and not os.getenv(required_env):
	if is_critical:
	logger.error(f"❌ Critical tool {tool_name} missing {required_env}")
	raise RuntimeError(f"Critical tool {tool_name} requires {required_env}")
	else:
	logger.warning(f"⚠️ Optional tool {tool_name} missing {required_env}")
	tool_status[tool_name] = f"Missing {required_env}"
	continue

	# Import and instantiate the tool
	module = __import__(module_path, fromlist=[class_name])
	tool_class = getattr(module, class_name)

	# Initialize tool with appropriate parameters
	if tool_name == 'exa':
	tool_instance = tool_class(api_key=os.getenv('EXA_API_KEY'))
	elif tool_name == 'firecrawl':
	tool_instance = tool_class(api_key=os.getenv('FIRECRAWL_API_KEY'))
	else:
	tool_instance = tool_class()

	tools.append(tool_instance)
	tool_status[tool_name] = "✅ Available"
	logger.info(f"✅ {class_name} initialized successfully")

	except Exception as e:
	if is_critical:
	logger.error(f"❌ Critical tool {tool_name} failed: {e}")
	raise RuntimeError(f"Critical tool {tool_name} failed to initialize: {e}")
	else:
	logger.warning(f"⚠️ Optional tool {tool_name} failed: {e}")
	tool_status[tool_name] = f"Error: {str(e)[:50]}"

	# Log tool status
	logger.info("📊 Tool Status Summary:")
	for tool_name, status in tool_status.items():
	logger.info(f" {tool_name}: {status}")

	return tools

	def _init_multimodal_tools(self) -> Optional[Any]:
	"""Initialize multimodal tools with error handling."""
	if not MULTIMODAL_AVAILABLE:
	logger.warning("⚠️ Multimodal tools not available")
	return None

	try:
	multimodal_tools = EnhancedRTLMultimodalTools()
	if ENHANCED_RTL_AVAILABLE:
	logger.info("✅ Enhanced RTL multimodal tools initialized")
	else:
	logger.info("✅ Standard multimodal tools initialized (RTL enhancement not available)")
	return multimodal_tools
	except Exception as e:
	logger.warning(f"⚠️ Failed to initialize multimodal tools: {e}")
	return None

	def _create_fixed_agent(self) -> Optional[Agent]:
	"""Create the agent with fixed instructions and configuration."""
	try:
	# Create Mistral model
	model = MistralChat(
	api_key=self.mistral_api_key,
	id="mistral-large-latest",
	temperature=0.0, # Zero temperature for consistent answers
	max_tokens=1000 # Shorter responses
	)

	# Create agent with fixed instructions
	agent = Agent(
	model=model,
	tools=self.tools,
	instructions=self._get_fixed_instructions(),
	show_tool_calls=True, # Enable tool call visibility for debugging
	markdown=True, # Enable markdown formatting
	debug_mode=True # Enable debug mode to see tool usage
	)

	logger.info(f"✅ Fixed GAIA Agent created with {len(self.tools)} tools")
	return agent

	except Exception as e:
	logger.error(f"❌ Failed to create fixed agent: {e}")
	return None

	def _get_fixed_instructions(self) -> str:
	"""Get fixed instructions that enforce proper answer format."""
	return """You are a GAIA evaluation agent. Your job is to answer questions accurately using available tools.

	🚨 CRITICAL RESPONSE FORMAT REQUIREMENTS 🚨

	YOU MUST ALWAYS END YOUR RESPONSE WITH:
	FINAL ANSWER: [your answer here]

	⚠️ NEVER INCLUDE:
	- JSON objects like {"name": "search_exa", "arguments": {"query": "..."}}
	- Tool call descriptions
	- Complex explanations
	- Markdown formatting
	- Multiple sentences

	✅ FORMATTING RULES:
	- Numbers: No commas (write "1234" not "1,234")
	- No units unless specifically requested
	- Single words or short phrases only
	- Clean, simple text only

	✅ CORRECT EXAMPLES:
	Question: "What is 25 * 17?"
	FINAL ANSWER: 425

	Question: "What is the capital of France?"
	FINAL ANSWER: Paris

	Question: "List three colors"
	FINAL ANSWER: blue, green, red

	❌ WRONG EXAMPLES (NEVER DO THIS):
	{"name": "search_exa", "arguments": {"query": "Stargate SG-1"}}
	The search tool returned information about...
	I need to use the calculator tool to compute...

	🔧 TOOL USAGE CRITICAL FIXES:
	- Use calculator for basic math operations
	- For Python calculations, ALWAYS use this pattern:
	* Store result in a variable (e.g., result = calculation)
	* Use variable_to_return parameter to get the value
	* Example: run_python_code("result = sum(range(1, 11))", variable_to_return="result")
	- For complex calculations requiring Python:
	* Write: result = your_calculation
	* Then use variable_to_return="result" to get the answer
	- Use web search tools for current information
	- Use wikipedia only when explicitly mentioned
	- Always verify your answer before responding

	🔧 PYTHON TOOL USAGE EXAMPLES:
	- For "What is 2^8?": run_python_code("result = 2**8", variable_to_return="result")
	- For "Sum 1 to 10": run_python_code("result = sum(range(1, 11))", variable_to_return="result")
	- For "25 * 17": run_python_code("result = 25 * 17", variable_to_return="result")

	🔧 SEARCH TOOL OPTIMIZATION:
	- For bird species: search_wikipedia("bird species diversity world") or search_exa("total bird species world 2024")
	- For artist discography: search_exa("Mercedes Sosa discography albums 2000-2009")
	- For factual counting: search_wikipedia first, then search_exa if needed
	- For current events: search_exa with specific queries

	🎥 YOUTUBE & VIDEO ANALYSIS TOOL USAGE:
	- For YouTube URLs with AUDIO/SPEECH questions: Use YouTube tool to get transcription
	- For YouTube URLs with VISUAL questions (counting objects, analyzing what's visible): Use video_analysis tool
	- Video analysis tool extracts frames and uses computer vision for visual questions
	- Examples:
	* "What does person say in video?" → Use YouTube tool (audio/transcript)
	* "How many birds are visible?" → Use video_analysis tool (visual analysis)
	* "Count objects in video" → Use video_analysis tool (visual analysis)

	🔄 IMAGE ANALYSIS & ROTATED TEXT RECOGNITION:
	- For images with text questions: Use analyze_image tool with enhanced RTL (rotated text) support
	- The tool can handle text in ALL orientations: normal (0°), rotated 90°, upside down (180°), rotated 270°
	- When analyzing images for text content, be specific about looking for rotated text
	- Examples:
	* "What text is in this image?" → Use analyze_image with question about text in any orientation
	* "Read the text in this document" → Use analyze_image with emphasis on rotated text detection
	* "What numbers do you see?" → Use analyze_image to find numbers regardless of orientation
	- The enhanced tool automatically tries multiple orientations for better text recognition

	� FINAL REMINDER:
	- Use tools to get information
	- Process the information
	- Extract the simple answer
	- End with "FINAL ANSWER: [simple answer]"
	- NEVER show tool calls or JSON in your final response

	This format is MANDATORY for evaluation success."""

	def __call__(self, question: str, files: Optional[List[Union[str, dict]]] = None) -> str:
	"""Process a question using the fixed agent with optional file attachments."""
	if not self.available:
	logger.error("❌ Fixed GAIA Agent not available")
	return "unknown"

	try:
	logger.info(f"🤔 Processing question: {question[:100]}...")

	# Process any attached files
	processed_files = []
	if files:
	logger.info(f"📎 Processing {len(files)} attached files...")
	processed_files = self._process_attached_files(files)

	# Enhance question with file information - let Agno handle tool selection
	enhanced_question = self._enhance_question_with_files(question, processed_files)

	# Enhance question for exponentiation operations
	final_question = self.prompt_enhancer.enhance_prompt_for_exponentiation(enhanced_question)
	if final_question != enhanced_question:
	logger.info("🔧 Enhanced question for exponentiation operation")

	# Use agent to process the final enhanced question
	response = self.agent.run(final_question)

	# Extract response content
	if hasattr(response, 'content'):
	raw_answer = response.content
	elif isinstance(response, str):
	raw_answer = response
	else:
	raw_answer = str(response)

	# Process the response using enhanced processor
	extraction_result = self.response_processor.process_response(raw_answer, question)
	formatted_answer = extraction_result.answer

	# Log processing details
	logger.info(f"🔍 Extraction strategy: {extraction_result.strategy.value}")
	logger.info(f"📊 Confidence: {extraction_result.confidence:.2f}")
	if hasattr(extraction_result, 'validation_issues') and extraction_result.validation_issues:
	logger.warning(f"⚠️ Validation issues: {', '.join(extraction_result.validation_issues)}")

	logger.info(f"✅ Question processed")
	logger.info(f"📝 Raw answer: {raw_answer[:200]}...")
	logger.info(f"🎯 Final answer: '{formatted_answer}'")

	return formatted_answer

	except Exception as e:
	logger.error(f"❌ Error processing question: {e}")
	return "unknown"
	finally:
	# Clean up any temporary files
	self._cleanup_processed_files()

	def _process_attached_files(self, files: List[Union[str, dict]]) -> List[ProcessedFile]:
	"""
	Process attached files for analysis.

	Args:
	files: List of file paths, file info dicts, or base64 content

	Returns:
	List of ProcessedFile objects
	"""
	processed_files = []

	for file_input in files:
	try:
	logger.info(f"📄 Processing file: {str(file_input)[:100]}...")

	# Process the file using enhanced file handler
	processed_file = self.file_handler.process_file_input(file_input)

	if processed_file.info.error:
	logger.warning(f"⚠️ File processing warning: {processed_file.info.error}")
	else:
	logger.info(f"✅ File processed: {processed_file.info.file_type.value} ({processed_file.info.file_format.value})")

	processed_files.append(processed_file)

	except Exception as e:
	logger.error(f"❌ Error processing file {file_input}: {e}")
	# Create error file info
	error_file = ProcessedFile(
	info=FileInfo(
	path=str(file_input),
	exists=False,
	file_type=FileType.UNKNOWN,
	file_format=FileFormat.UNKNOWN,
	size_bytes=None,
	mime_type=None,
	is_base64=False,
	error=f"Processing failed: {e}",
	metadata={}
	),
	content=None,
	temp_path=None,
	cleanup_required=False
	)
	processed_files.append(error_file)

	return processed_files

	def _enhance_question_with_files(self, question: str, processed_files: List[ProcessedFile]) -> str:
	"""
	Enhance the question with file information for better processing.

	Args:
	question: Original question
	processed_files: List of processed files

	Returns:
	Enhanced question with file context
	"""
	if not processed_files:
	return question

	enhanced_question = f"Question: {question}\n\nAttached Files:\n"

	for i, processed_file in enumerate(processed_files, 1):
	file_info = processed_file.info

	# Add file information with proper path resolution
	if file_info.exists and not file_info.error:
	# Use the resolved absolute path for file access
	resolved_path = file_info.path

	if file_info.file_type == FileType.IMAGE:
	enhanced_question += f"File {i}: image ({file_info.file_format.value}), {file_info.size_bytes} bytes\n"
	enhanced_question += f"Image file path: {resolved_path}\n"
	enhanced_question += f"Use analyze_image tool with file_path: '{resolved_path}' to analyze this image.\n"

	elif file_info.file_type == FileType.AUDIO:
	enhanced_question += f"File {i}: audio ({file_info.file_format.value}), {file_info.size_bytes} bytes\n"
	enhanced_question += f"Audio file path: {resolved_path}\n"
	enhanced_question += f"Use transcribe_audio tool with file_path: '{resolved_path}' to transcribe this audio.\n"

	elif file_info.file_type == FileType.DOCUMENT:
	enhanced_question += f"File {i}: document ({file_info.file_format.value}), {file_info.size_bytes} bytes\n"
	enhanced_question += f"Document file path: {resolved_path}\n"
	enhanced_question += f"Use analyze_document tool with file_path: '{resolved_path}' to analyze this document.\n"

	else:
	# For other file types, just provide basic info
	enhanced_question += f"File {i}: {file_info.file_type.value} ({file_info.file_format.value}), {file_info.size_bytes} bytes\n"
	enhanced_question += f"File available at: {resolved_path}\n"

	else:
	# File has errors
	enhanced_question += f"File {i}: {file_info.file_type.value} (ERROR: {file_info.error})\n"

	enhanced_question += f"\nPlease analyze the question in the context of the provided files and give a precise answer.\n"
	enhanced_question += f"IMPORTANT: Use the exact file paths provided above when calling analysis tools.\n"

	# Add specific instructions for exponentiation if detected
	if any(op in question.lower() for op in ['power', '^', '**', 'exponent', 'raised to']):
	enhanced_question += "\nIMPORTANT: This question involves exponentiation. Please use Python code to calculate the result accurately.\n"
	enhanced_question += "For exponentiation operations:\n"
	enhanced_question += "- Use the operator in Python (e.g., 28 for 2 to the power of 8)\n"
	enhanced_question += "- Do NOT use the ^ symbol as it means XOR in Python, not exponentiation\n"
	enhanced_question += "- Use the pow() function if needed (e.g., pow(2, 8))\n"
	enhanced_question += "\nPlease calculate this step by step using Python to ensure accuracy.\n"

	# Continue to add file content processing
	if not processed_files:
	return question

	# Build file context
	file_context = []
	multimodal_data = {}

	for i, processed_file in enumerate(processed_files):
	file_info = processed_file.info

	if file_info.error:
	file_context.append(f"File {i+1}: ERROR - {file_info.error}")
	continue

	# Add basic file information
	file_desc = f"File {i+1}: {file_info.file_type.value} ({file_info.file_format.value})"
	if file_info.size_bytes:
	file_desc += f", {file_info.size_bytes} bytes"

	file_context.append(file_desc)

	# Handle different file types for multimodal processing
	if file_info.file_type == FileType.IMAGE and self.multimodal_tools:
	try:
	# Use multimodal tools for image analysis
	image_path = processed_file.temp_path or file_info.path
	analysis = self.multimodal_tools.analyze_image(image_path, question)
	file_context.append(f"Image Analysis: {analysis}")
	multimodal_data[f'image_{i}'] = image_path
	except Exception as e:
	logger.warning(f"Image analysis failed: {e}")
	file_context.append(f"Image Analysis: Failed - {e}")

	elif file_info.file_type == FileType.AUDIO and self.multimodal_tools:
	try:
	# Use multimodal tools for audio transcription
	audio_path = processed_file.temp_path or file_info.path
	transcription = self.multimodal_tools.transcribe_audio(audio_path)
	file_context.append(f"Audio Transcription: {transcription}")
	multimodal_data[f'audio_{i}'] = audio_path
	except Exception as e:
	logger.warning(f"Audio transcription failed: {e}")
	file_context.append(f"Audio Transcription: Failed - {e}")

	elif file_info.file_type == FileType.DOCUMENT:
	try:
	# Read document content
	if processed_file.content:
	if file_info.file_format == FileFormat.TXT:
	content = processed_file.content.decode('utf-8', errors='ignore')
	file_context.append(f"Document Content: {content[:1000]}...")
	else:
	file_context.append(f"Document: {file_info.file_format.value} format detected")
	except Exception as e:
	logger.warning(f"Document reading failed: {e}")
	file_context.append(f"Document: Could not read content - {e}")

	elif file_info.file_type == FileType.DATA:
	try:
	# Handle data files
	if file_info.file_format == FileFormat.JSON and processed_file.content:
	import json
	data = json.loads(processed_file.content.decode('utf-8'))
	file_context.append(f"JSON Data: {str(data)[:500]}...")
	elif file_info.file_format == FileFormat.CSV and processed_file.content:
	content = processed_file.content.decode('utf-8', errors='ignore')
	lines = content.split('\n')[:10] # First 10 lines
	file_context.append(f"CSV Data (first 10 lines):\n{chr(10).join(lines)}")
	elif file_info.file_format == FileFormat.XLSX and processed_file.content:
	# For Excel files, use the file handler's Excel reading capability
	excel_content = self.file_handler.read_excel_file(file_info.path)
	if excel_content:
	lines = excel_content.split('\n')[:10] # First 10 lines of CSV conversion
	file_context.append(f"Excel Data (converted to CSV, first 10 lines):\n{chr(10).join(lines)}")
	else:
	file_context.append(f"Excel file detected but could not read content: {file_info.path}")
	else:
	file_context.append(f"Data File: {file_info.file_format.value} format")
	except Exception as e:
	logger.warning(f"Data file processing failed: {e}")
	file_context.append(f"Data File: Could not process - {e}")

	elif file_info.file_type == FileType.CODE:
	try:
	# Read code content
	if processed_file.content:
	content = processed_file.content.decode('utf-8', errors='ignore')
	file_context.append(f"Code Content ({file_info.file_format.value}): {content[:1000]}...")
	except Exception as e:
	logger.warning(f"Code file reading failed: {e}")
	file_context.append(f"Code File: Could not read - {e}")

	# Add file content to the existing enhanced question
	if file_context:
	enhanced_question += f"\n\nFile Content:\n{chr(10).join(file_context)}\n"

	logger.info(f"📝 Enhanced question with {len(processed_files)} files")
	return enhanced_question

	def _cleanup_processed_files(self):
	"""Clean up any temporary files created during processing."""
	try:
	self.file_handler.cleanup_temp_files()
	logger.info("🗑️ Temporary files cleaned up")
	except Exception as e:
	logger.warning(f"⚠️ Cleanup warning: {e}")

	def get_processor_statistics(self) -> Dict[str, Any]:
	"""Get enhanced response processor statistics."""
	if hasattr(self, 'response_processor'):
	return self.response_processor.get_statistics()
	return {}

	def get_tool_status(self) -> Dict[str, Any]:
	"""Get the current status of all tools."""
	multimodal_status = {}
	if hasattr(self, 'multimodal_tools') and self.multimodal_tools:
	multimodal_status = self.multimodal_tools.get_capabilities_status()

	file_handler_status = {}
	if hasattr(self, 'file_handler'):
	file_handler_status = {
	'supported_formats': {
	file_type.value: [fmt.value for fmt in formats]
	for file_type, formats in self.file_handler.get_supported_formats().items()
	},
	'base_paths': self.file_handler.base_paths,
	'temp_files_count': len(self.file_handler.temp_files)
	}

	return {
	'available': self.available,
	'tools_count': len(self.tools) if self.tools else 0,
	'mistral_api_key_present': bool(self.mistral_api_key),
	'agent_created': self.agent is not None,
	'multimodal_tools_available': MULTIMODAL_AVAILABLE,
	'multimodal_status': multimodal_status,
	'file_handler_status': file_handler_status
	}


	# Create global agent instance
	fixed_gaia_agent = FixedGAIAAgent()


	def process_question(question: str) -> str:
	"""Process a question using the fixed GAIA agent."""
	return fixed_gaia_agent(question)


	def get_agent_status() -> Dict[str, Any]:
	"""Get the current status of the fixed GAIA agent."""
	return fixed_gaia_agent.get_tool_status()