Final_Assignment_Template

Sleeping

App Files Files Community

dalybuilds committed on Jul 19

Commit

6d169a1

verified ·

1 Parent(s): df2d975

Update app.py

Browse files

Files changed (1) hide show

app.py +14 -10

app.py CHANGED Viewed

@@ -5,15 +5,16 @@ import pandas as pd
 from io import BytesIO
 import re
 import subprocess
 # --- Tool-specific Imports ---
 from pytube import YouTube
-# --- LangChain & Groq Imports ---
 from groq import Groq
 from langchain_groq import ChatGroq
 from langchain.agents import AgentExecutor, create_tool_calling_agent
-from langchain_tavily import TavilySearchResults
 from langchain_core.prompts import ChatPromptTemplate
 from langchain.tools import Tool
@@ -40,13 +41,13 @@ def transcribe_audio_file(task_id: str) -> str:
     except Exception as e:
         return f"Error during audio file transcription: {e}"
-# --- Tool Definition: Video Transcription (using FFmpeg) ---
 def transcribe_youtube_video(video_url: str) -> str:
     """
     Downloads a YouTube video from a URL, extracts its audio using FFmpeg, and transcribes it.
     Use this tool ONLY when a question provides a youtube.com URL.
     """
-    print(f"Tool 'transcribe_youtube_video' (ffmpeg) called with URL: {video_url}")
     video_path, audio_path = None, None
     try:
         os.makedirs(TEMP_DIR, exist_ok=True)
@@ -54,8 +55,10 @@ def transcribe_youtube_video(video_url: str) -> str:
         stream = yt.streams.filter(only_audio=True).first()
         video_path = stream.download(output_path=TEMP_DIR)
         audio_path = os.path.join(TEMP_DIR, "output.mp3")
-        command = ["ffmpeg", "-i", video_path, "-y", "-q:a", "0", "-map", "a", audio_path]
-        subprocess.run(command, check=True, capture_output=True, text=True)
         client = Groq(api_key=os.getenv("GROQ_API_KEY"))
         with open(audio_path, "rb") as audio_file:
             transcription = client.audio.transcriptions.create(file=audio_file, model="whisper-large-v3", response_format="text")
@@ -71,13 +74,14 @@ class LangChainAgent:
     def __init__(self, groq_api_key: str, tavily_api_key: str):
         self.llm = ChatGroq(model_name="llama3-70b-8192", groq_api_key=groq_api_key, temperature=0.0)
         self.tools = [
-            TavilySearchResults(name="web_search", max_results=3, tavily_api_key=tavily_api_key, description="A search engine for finding up-to-date information on the internet."),
             Tool(name="audio_file_transcriber", func=transcribe_audio_file, description="Use this for questions mentioning an audio file (.mp3, recording). Input MUST be the task_id."),
             Tool(name="youtube_video_transcriber", func=transcribe_youtube_video, description="Use this for questions with a youtube.com URL. Input MUST be the URL."),
         ]
         prompt = ChatPromptTemplate.from_messages([
             ("system", (
-                "You are a powerful problem-solving agent. You have access to a web search tool, an audio file transcriber, and a YouTube video transcriber.\n\n"
                 "**REASONING PROCESS:**\n"
                 "1.  **Analyze the question:** Determine if a tool is needed. Is it a general knowledge question, or does it mention an audio file or a YouTube URL?\n"
                 "2.  **Select ONE tool based on the question:**\n"
@@ -157,7 +161,7 @@ with gr.Blocks() as demo:
 if __name__ == "__main__":
     print("\n" + "-"*30 + " App Starting " + "-"*30)
-    for key in ["GROQ_API_KEY", "TAVILY_API_KEY"]:
         print(f"✅ {key} secret is set." if os.getenv(key) else f"⚠️ WARNING: {key} secret is not set.")
     print("-"*(60 + len(" App Starting ")) + "\n")
-    demo.launch(debug=True, share=False)

 from io import BytesIO
 import re
 import subprocess
+import ffmpeg
 # --- Tool-specific Imports ---
 from pytube import YouTube
+# --- LangChain & Dependency Imports ---
 from groq import Groq
 from langchain_groq import ChatGroq
 from langchain.agents import AgentExecutor, create_tool_calling_agent
+from langchain_tavily import TavilySearch
 from langchain_core.prompts import ChatPromptTemplate
 from langchain.tools import Tool
     except Exception as e:
         return f"Error during audio file transcription: {e}"
+# --- Tool Definition: Video Transcription (using ffmpeg-python) ---
 def transcribe_youtube_video(video_url: str) -> str:
     """
     Downloads a YouTube video from a URL, extracts its audio using FFmpeg, and transcribes it.
     Use this tool ONLY when a question provides a youtube.com URL.
     """
+    print(f"Tool 'transcribe_youtube_video' (ffmpeg-python) called with URL: {video_url}")
     video_path, audio_path = None, None
     try:
         os.makedirs(TEMP_DIR, exist_ok=True)
         stream = yt.streams.filter(only_audio=True).first()
         video_path = stream.download(output_path=TEMP_DIR)
         audio_path = os.path.join(TEMP_DIR, "output.mp3")
+        # Use ffmpeg-python instead of subprocess
+        stream = ffmpeg.input(video_path)
+        stream = ffmpeg.output(stream, audio_path, q=0, map='a', y='y')
+        ffmpeg.run(stream)
         client = Groq(api_key=os.getenv("GROQ_API_KEY"))
         with open(audio_path, "rb") as audio_file:
             transcription = client.audio.transcriptions.create(file=audio_file, model="whisper-large-v3", response_format="text")
     def __init__(self, groq_api_key: str, tavily_api_key: str):
         self.llm = ChatGroq(model_name="llama3-70b-8192", groq_api_key=groq_api_key, temperature=0.0)
         self.tools = [
+            TavilySearch(name="web_search", max_results=3, tavily_api_key=tavily_api_key, description="A search engine for finding up-to-date information on the internet."),
             Tool(name="audio_file_transcriber", func=transcribe_audio_file, description="Use this for questions mentioning an audio file (.mp3, recording). Input MUST be the task_id."),
             Tool(name="youtube_video_transcriber", func=transcribe_youtube_video, description="Use this for questions with a youtube.com URL. Input MUST be the URL."),
         ]
         prompt = ChatPromptTemplate.from_messages([
             ("system", (
+                "You are a powerful problem-solving agent. Your goal is to answer the user's question accurately. "
+                "You have access to a web search tool, an audio file transcriber, and a YouTube video transcriber.\n\n"
                 "**REASONING PROCESS:**\n"
                 "1.  **Analyze the question:** Determine if a tool is needed. Is it a general knowledge question, or does it mention an audio file or a YouTube URL?\n"
                 "2.  **Select ONE tool based on the question:**\n"
 if __name__ == "__main__":
     print("\n" + "-"*30 + " App Starting " + "-"*30)
+    for key in ["GROQ_API_KEY", "TAVILY_API_KEY", "SPACE_ID"]:
         print(f"✅ {key} secret is set." if os.getenv(key) else f"⚠️ WARNING: {key} secret is not set.")
     print("-"*(60 + len(" App Starting ")) + "\n")
+    demo.launch(debug=True, share=False)