Spaces:

AnalysisWithMSR
/

SEO

Sleeping

App Files Files Community

AnalysisWithMSR committed on Dec 14, 2024

Commit

b12cec2

verified ·

1 Parent(s): 04621a9

Update app.py

Browse files

Files changed (1) hide show

app.py +15 -4

app.py CHANGED Viewed

@@ -18,6 +18,12 @@ youtube_api_key = os.getenv("YOUTUBE_API_KEY")
 openai_api_key = os.getenv("OPENAI_API_KEY")
 openai.api_key = openai_api_key
 def extract_video_id(url):
     """Extracts the video ID from a YouTube URL."""
     try:
@@ -51,6 +57,7 @@ def get_video_duration(video_id, api_key):
         return None
 def download_and_transcribe_with_whisper(youtube_url):
     try:
         with tempfile.TemporaryDirectory() as temp_dir:
             temp_audio_file = os.path.join(temp_dir, "audio.mp3")
@@ -58,8 +65,11 @@ def download_and_transcribe_with_whisper(youtube_url):
             ydl_opts = {
                 'format': 'bestaudio/best',
                 'outtmpl': temp_audio_file,
-                'extractaudio': True,
-                'audioquality': 1,
             }
             # Download audio using yt-dlp
@@ -132,6 +142,7 @@ def summarize_text_huggingface(text):
     return " ".join(summaries)
 def generate_optimized_content(summarized_transcript):
     prompt = f"""
     Analyze the following summarized YouTube video transcript and:
     1. Extract the top 10 keywords.
@@ -163,11 +174,11 @@ def generate_optimized_content(summarized_transcript):
     except Exception as e:
         return {"error": str(e)}
 def process_video(youtube_url):
     transcript = get_transcript(youtube_url)
     if not transcript:
-        return "Could not fetch the transcript. Please try another video."
     summary = summarize_text_huggingface(transcript)
     optimized_content = generate_optimized_content(summary)

 openai_api_key = os.getenv("OPENAI_API_KEY")
 openai.api_key = openai_api_key
+if not youtube_api_key:
+    raise ValueError("YOUTUBE_API_KEY is not set. Please set it as an environment variable.")
+if not openai_api_key:
+    raise ValueError("OPENAI_API_KEY is not set. Please set it as an environment variable.")
 def extract_video_id(url):
     """Extracts the video ID from a YouTube URL."""
     try:
         return None
 def download_and_transcribe_with_whisper(youtube_url):
+    """Downloads audio from YouTube and transcribes it using Whisper."""
     try:
         with tempfile.TemporaryDirectory() as temp_dir:
             temp_audio_file = os.path.join(temp_dir, "audio.mp3")
             ydl_opts = {
                 'format': 'bestaudio/best',
                 'outtmpl': temp_audio_file,
+                'postprocessors': [{
+                    'key': 'FFmpegExtractAudio',
+                    'preferredcodec': 'mp3',
+                    'preferredquality': '192',
+                }],
             }
             # Download audio using yt-dlp
     return " ".join(summaries)
 def generate_optimized_content(summarized_transcript):
+    """Generates optimized video metadata using OpenAI's GPT model."""
     prompt = f"""
     Analyze the following summarized YouTube video transcript and:
     1. Extract the top 10 keywords.
     except Exception as e:
         return {"error": str(e)}
 def process_video(youtube_url):
+    """Processes a YouTube URL to generate optimized metadata."""
     transcript = get_transcript(youtube_url)
     if not transcript:
+        return {"error": "Could not fetch the transcript. Please try another video."}
     summary = summarize_text_huggingface(transcript)
     optimized_content = generate_optimized_content(summary)