Spaces:

Hamed744
/

Ttspro

Running

App Files Files Community

Hamed744 committed on Jun 5

Commit

e4d0150

verified ·

1 Parent(s): 41e2093

Update app.py

Browse files

Files changed (1) hide show

app.py +430 -345

app.py CHANGED Viewed

@@ -1,3 +1,4 @@
 import base64
 import mimetypes
 import os
@@ -5,28 +6,36 @@ import re
 import struct
 import time
 import zipfile
-import shutil
 from google import genai
 from google.genai import types
 try:
     from pydub import AudioSegment
     PYDUB_AVAILABLE = True
 except ImportError:
     PYDUB_AVAILABLE = False
-    print("⚠️ pydub در دسترس نیست. فایل‌های صوتی به صورت جداگانه ذخیره می‌شوند.")
-import gradio as gr
-# --- Helper functions ---
-def save_binary_file(file_name, data):
-    output_dir = "outputs"
-    os.makedirs(output_dir, exist_ok=True)
-    full_file_path = os.path.join(output_dir, file_name)
-    with open(full_file_path, "wb") as f:
-        f.write(data)
-    print(f"✅ فایل در مسیر زیر ذخیره شد: {full_file_path}")
-    return full_file_path
 def convert_to_wav(audio_data: bytes, mime_type: str) -> bytes:
     parameters = parse_audio_mime_type(mime_type)
@@ -38,6 +47,7 @@ def convert_to_wav(audio_data: bytes, mime_type: str) -> bytes:
     block_align = num_channels * bytes_per_sample
     byte_rate = sample_rate * block_align
     chunk_size = 36 + data_size
     header = struct.pack(
         "<4sI4s4sIHHIIHH4sI",
         b"RIFF", chunk_size, b"WAVE", b"fmt ", 16, 1, num_channels,
@@ -47,7 +57,7 @@ def convert_to_wav(audio_data: bytes, mime_type: str) -> bytes:
 def parse_audio_mime_type(mime_type: str) -> dict[str, int | None]:
     bits_per_sample = 16
-    rate = 24000
     parts = mime_type.split(";")
     for param in parts:
         param = param.strip()
@@ -55,397 +65,472 @@ def parse_audio_mime_type(mime_type: str) -> dict[str, int | None]:
             try:
                 rate_str = param.split("=", 1)[1]
                 rate = int(rate_str)
-            except (ValueError, IndexError): pass
-        elif param.lower().startswith("audio/l"):
             try:
-                bits_str = param.split("L", 1)[1]
-                bits_per_sample = int(re.match(r'\d+', bits_str).group(0))
-            except (ValueError, IndexError, AttributeError):
                 pass
     return {"bits_per_sample": bits_per_sample, "rate": rate}
-def load_text_from_gradio_file(file_obj):
-    if file_obj is None: return ""
-    try:
-        with open(file_obj.name, 'r', encoding='utf-8') as f:
-            content = f.read().strip()
-        print(f"📖 متن بارگذاری شده: {len(content)} کاراکتر")
-        return content
-    except Exception as e:
-        print(f"❌ خطا در خواندن فایل: {e}")
-        return ""
 def smart_text_split(text, max_size=3800):
-    if len(text) <= max_size: return [text]
     chunks = []
     current_chunk = ""
-    processed_text = re.sub(r'\s+', ' ', text).strip()
-    sentences = re.split(r'(?<=[.!?؟])\s+', processed_text)
     for sentence in sentences:
-        if not sentence.strip(): continue
-        if len(current_chunk) + (1 if current_chunk else 0) + len(sentence) > max_size:
             if current_chunk:
                 chunks.append(current_chunk.strip())
-            current_chunk = ""
-            while len(sentence) > max_size:
-                split_at = sentence[:max_size].rfind(' ')
-                if split_at <= 0 or split_at < max_size // 3:
-                    split_at = max_size
-                chunks.append(sentence[:split_at].strip())
-                sentence = sentence[split_at:].strip()
-            current_chunk = sentence
         else:
-            if current_chunk:
-                current_chunk += " " + sentence
-            else:
-                current_chunk = sentence
-    if current_chunk.strip():
         chunks.append(current_chunk.strip())
-    return [c for c in chunks if c]
-def merge_audio_files_func(file_paths, output_path):
     if not PYDUB_AVAILABLE:
-        return None, "خطا: کتابخانه pydub برای ادغام فایل‌ها در دسترس نیست."
-    if not file_paths: return None, "خطا: هیچ فایلی برای ادغام وجود ندارد."
-    output_dir = os.path.dirname(output_path)
-    if output_dir: os.makedirs(output_dir, exist_ok=True)
     try:
-        log_messages = [f"🔗 در حال ادغام {len(file_paths)} فایل صوتی..."]
         combined = AudioSegment.empty()
-        valid_files_merged = 0
         for i, file_path in enumerate(file_paths):
-            if os.path.exists(file_path) and os.path.getsize(file_path) > 0:
-                try:
-                    log_messages.append(f"📎 اضافه کردن فایل {i+1}: {os.path.basename(file_path)}")
-                    audio = AudioSegment.from_file(file_path)
-                    combined += audio
-                    if i < len(file_paths) - 1: combined += AudioSegment.silent(duration=200)
-                    valid_files_merged += 1
-                except Exception as e:
-                    log_messages.append(f"⚠️ خطا در خواندن یا اضافه کردن فایل {os.path.basename(file_path)}: {e}")
             else:
-                log_messages.append(f"⚠️ فایل پیدا نشد یا خالی است: {os.path.basename(file_path)}")
-        if valid_files_merged == 0:
-             return None, "\n".join(log_messages) + "\n❌ هیچ فایل معتبری برای ادغام پیدا نشد."
-        combined.export(output_path, format="wav")
-        log_messages.append(f"✅ فایل ادغام شده ذخیره شد: {os.path.basename(output_path)}")
-        return output_path, "\n".join(log_messages)
     except Exception as e:
-        return None, f"❌ خطا در ادغام فایل‌ها: {e}"
-def create_zip_file(file_paths, zip_name_base):
-    output_dir = "outputs"
-    os.makedirs(output_dir, exist_ok=True)
-    zip_path = os.path.join(output_dir, f"{zip_name_base}.zip")
     try:
-        with zipfile.ZipFile(zip_path, 'w') as zipf:
             for file_path in file_paths:
                 if os.path.exists(file_path):
                     zipf.write(file_path, os.path.basename(file_path))
-        return zip_path, f"📦 فایل ZIP ایجاد شد: {os.path.basename(zip_path)}"
     except Exception as e:
-        return None, f"❌ خطا در ایجاد فایل ZIP: {e}"
-def cleanup_temp_files(files_to_delete):
-    if not files_to_delete: return
-    for f_path in files_to_delete:
-        if f_path and os.path.exists(f_path):
-            try:
-                os.remove(f_path)
-            except Exception as e:
-                print(f"⚠️ خطا در حذف فایل {f_path}: {e}")
-# --- Main generation function for Gradio ---
-def generate_audio_gradio(
-    use_file_input, text_file_obj, text_to_speak, speech_prompt,
-    selected_voice, output_filename_base, model_name, temperature,
-    max_chunk_size, sleep_between_requests, merge_audio_files, delete_partial_files,
-    progress=gr.Progress(track_tqdm=True)
 ):
-    log_messages = ["🚀 شروع فرآیند تبدیل متن به گفتار...\n"]
-    output_main_dir = "outputs"
-    os.makedirs(output_main_dir, exist_ok=True)
-    if os.path.exists(output_main_dir) and output_filename_base:
-        for item in os.listdir(output_main_dir):
-            if item.startswith(output_filename_base):
-                try:
-                    item_path = os.path.join(output_main_dir, item)
-                    if os.path.isfile(item_path) or os.path.islink(item_path): os.unlink(item_path)
-                    elif os.path.isdir(item_path): shutil.rmtree(item_path)
-                    log_messages.append(f"🗑️ فایل قدیمی '{item}' حذف شد.")
-                except Exception as e:
-                    log_messages.append(f"⚠️ خطا در حذف فایل قدیمی '{item}': {e}")
-    text_input = load_text_from_gradio_file(text_file_obj) if use_file_input else text_to_speak
-    if use_file_input:
-        log_messages.append(f"📁 حالت فایل فعال است.")
-        if text_file_obj is None:
-            log_messages.append("❌ خطا: هیچ فایلی آپلود نشده است.")
-            return gr.update(visible=False), gr.update(visible=False), "\n".join(log_messages)
-        if not text_input:
-            log_messages.append("❌ خطا: متن استخراج شده از فایل خالی است.")
-            return gr.update(visible=False), gr.update(visible=False), "\n".join(log_messages)
-        log_messages.append(f"✅ متن از '{os.path.basename(text_file_obj.name)}' با موفقیت بارگذاری شد.")
-    else:
-        log_messages.append("⌨️ حالت ورودی دستی فعال است.")
-    if not text_input or not text_input.strip():
-        log_messages.append("❌ خطا: متن ورودی برای تبدیل به گفتار خالی است.")
-        return gr.update(visible=False), gr.update(visible=False), "\n".join(log_messages)
-    api_key_env = os.environ.get("GEMINI_API_KEY") or os.environ.get("GOOGLE_API_KEY")
-    if not api_key_env:
-        log_messages.append("❌ خطا: کلید API جمینای (GEMINI_API_KEY یا GOOGLE_API_KEY) در Secrets پیدا نشد.")
-        log_messages.append("لطفاً کلید API خود را در بخش Settings -> Secrets این Space تنظیم کنید.")
-        return gr.update(visible=False), gr.update(visible=False), "\n".join(log_messages)
-    log_messages.append("🔑 کلید API از Hugging Face Secrets بارگذاری شد (کتابخانه باید آن را به طور خودکار بخواند).")
-    text_chunks = smart_text_split(text_input, int(max_chunk_size))
-    if not text_chunks:
-        log_messages.append("❌ خطا: پس از تقسیم‌بندی، هیچ قطعه متنی برای پردازش وجود ندارد.")
-        return gr.update(visible=False), gr.update(visible=False), "\n".join(log_messages)
-    log_messages.append(f"📊 متن به {len(text_chunks)} قطعه تقسیم شد:")
-    for i_chunk, chunk_content in enumerate(text_chunks): log_messages.append(f"  📝 قطعه {i_chunk+1}: {len(chunk_content)} کاراکتر - '{chunk_content[:50].replace(chr(10), ' ')}...'")
-    generated_files = []
-    total_chunks = len(text_chunks)
     try:
-        log_messages.append(f"🛠️ در حال آماده‌سازی مدل جمینای ({model_name})...")
-        generative_model_client = genai.GenerativeModel(model_name=model_name)
-        log_messages.append(f"✅ مدل جمینای ({model_name}) با موفقیت آماده شد.")
     except Exception as e:
-        log_messages.append(f"❌ خطا در آماده‌سازی مدل جمینای ({model_name}): {type(e).__name__} - {e}")
-        if "API_KEY_INVALID" in str(e).upper() or "API key" in str(e).lower() or "credential" in str(e).lower() or "permission_denied" in str(e).lower():
-            log_messages.append("   🔑 مشکل احتمالی با کلید API یا دسترسی‌ها. مطمئن شوید GEMINI_API_KEY (یا GOOGLE_API_KEY) در Secrets صحیح و فعال است و به مدل دسترسی دارید.")
-        import traceback
-        log_messages.append(f"   Traceback: {traceback.format_exc()}")
-        return gr.update(visible=False), gr.update(visible=False), "\n".join(log_messages)
-    for i, chunk_text in enumerate(progress.tqdm(text_chunks, desc="تولید قطعات صوتی")):
-        current_log = [f"\n🔊 تولید صدا برای قطعه {i+1}/{total_chunks}..."]
-        final_text_for_api = f"{speech_prompt}\n{chunk_text}" if speech_prompt and speech_prompt.strip() else chunk_text
-        current_log.append(f"   متن ارسالی به API (اول 50 کاراکتر): '{final_text_for_api[:50].replace(chr(10), ' ')}...'")
         try:
-            contents_for_api = [types.Content(role="user", parts=[types.Part.from_text(text=final_text_for_api)])]
-            gen_config = types.GenerateContentConfig(
-                temperature=float(temperature),
-                response_modalities=["audio"],
-                speech_config=types.SpeechConfig(
-                    voice_config=types.VoiceConfig(
-                        prebuilt_voice_config=types.PrebuiltVoiceConfig(
-                            voice_name=selected_voice
-                        )
-                    )
-                )
-            )
-            response = generative_model_client.generate_content(
-                contents=contents_for_api,
-                generation_config=gen_config
             )
-            audio_data_buffer = b""
-            final_mime_type = "audio/wav"
-            audio_part_found = False
-            if response.candidates and response.candidates[0].content and response.candidates[0].content.parts:
-                for part in response.candidates[0].content.parts:
-                    if part.inline_data and part.inline_data.mime_type and part.inline_data.mime_type.startswith("audio/"):
-                        audio_data_buffer = part.inline_data.data
-                        final_mime_type = part.inline_data.mime_type
-                        audio_part_found = True
-                        current_log.append(f"   دریافت داده صوتی با MIME-type: {final_mime_type}")
-                        break
-            if not audio_part_found:
-                current_log.append(f"   ⚠️ داده صوتی برای قطعه {i+1} در پاسخ API یافت نشد.")
-                if hasattr(response, 'text') and response.text:
-                    current_log.append(f"   متن پاسخ API: {response.text}")
-                if hasattr(response, 'prompt_feedback') and response.prompt_feedback and response.prompt_feedback.block_reason:
-                    current_log.append(f"   مسدودسازی پرامپت: {response.prompt_feedback.block_reason.name} - {response.prompt_feedback.block_reason_message}")
-                current_log.append(f"   پاسخ کامل (اول 200 کاراکتر): {str(response)[:200]}")
-            if audio_data_buffer:
-                file_extension = mimetypes.guess_extension(final_mime_type)
-                if not file_extension or file_extension.lower() == ".bin":
-                    file_extension = ".wav"
-                processed_data_buffer = audio_data_buffer
-                chunk_filename_base = f"{output_filename_base}_part_{i+1:03d}"
-                generated_file_path = save_binary_file(f"{chunk_filename_base}{file_extension}", processed_data_buffer)
-                generated_files.append(generated_file_path)
-                current_log.append(f"✅ قطعه {i+1} تولید و ذخیره شد: {os.path.basename(generated_file_path)}")
         except Exception as e:
-            current_log.append(f"❌ خطا در تولید قطعه {i+1}: {type(e).__name__} - {e}")
-            if "API key" in str(e).lower() or "permission_denied" in str(e).lower() or "quota" in str(e).lower():
-                 current_log.append("   🔑 مشکل احتمالی با کلید API، دسترسی به مدل، یا محدودیت‌های استفاده. لطفاً تنظیمات Secrets و مدل انتخابی را بررسی کنید و از محدودیت‌های حساب خود مطلع باشید.")
-            import traceback
-            current_log.append(f"   Traceback: {traceback.format_exc()}")
-        log_messages.extend(current_log)
-        if i < total_chunks - 1 and float(sleep_between_requests) > 0:
-            log_messages.append(f"⏱️ انتظار {float(sleep_between_requests)} ثانیه...")
-            time.sleep(float(sleep_between_requests))
     if not generated_files:
-        log_messages.append("\n❌ هیچ فایل صوتی تولید نشد!")
-        return gr.update(value=None, visible=False), gr.update(value=None, visible=False), "\n".join(log_messages)
-    log_messages.append(f"\n🎉 {len(generated_files)} فایل صوتی با موفقیت تولید شد!")
-    final_audio_output_path = None
-    zip_file_output_path = None
-    audio_output_visible = False
-    file_output_visible = False
-    if merge_audio_files and len(generated_files) > 1:
-        merged_filename_path = os.path.join(output_main_dir, f"{output_filename_base}_merged.wav")
-        merged_path, merge_log = merge_audio_files_func(generated_files, merged_filename_path)
-        log_messages.append(merge_log or "")
-        if merged_path:
-            final_audio_output_path = merged_path
-            audio_output_visible = True
-            file_output_visible = True
-            if delete_partial_files:
-                cleanup_temp_files([f for f in generated_files if f != final_audio_output_path])
-        else:
-            zip_file_output_path, zip_log = create_zip_file(generated_files, f"{output_filename_base}_all_parts")
-            log_messages.append(zip_log or "")
-            if zip_file_output_path: file_output_visible = True
-            if generated_files: final_audio_output_path = generated_files[0]; audio_output_visible = True
     elif len(generated_files) == 1:
-        final_audio_output_path = generated_files[0]
-        audio_output_visible = True
-        file_output_visible = True
-    else:
-        if not merge_audio_files and len(generated_files) > 1:
-            zip_file_output_path, zip_log = create_zip_file(generated_files, f"{output_filename_base}_all_parts")
-            log_messages.append(zip_log or "")
-            if zip_file_output_path: file_output_visible = True
-            if generated_files: final_audio_output_path = generated_files[0]; audio_output_visible = True
-        elif generated_files:
-            final_audio_output_path = generated_files[0]; audio_output_visible = True; file_output_visible = True
-    primary_audio_to_play = final_audio_output_path
-    downloadable_file = zip_file_output_path if zip_file_output_path else final_audio_output_path
-    return (
-        gr.update(value=primary_audio_to_play, visible=audio_output_visible),
-        gr.update(value=downloadable_file, visible=file_output_visible),
-        "\n".join(log_messages)
-    )
-# --- Gradio Interface ---
-css = """
-body { font-family: 'Tahoma', 'Arial', sans-serif; }
-.gradio-container { max-width: 850px !important; margin: auto !important; padding-top: 1.5rem; }
-footer { display: none !important; } .gr-button { min-width: 180px; }
-h1 { text-align: center; color: #2E7D32; margin-bottom: 0.5rem;}
-.gr-input, .gr-output {border-radius: 8px !important;}
-.small-info {font-size: 0.85em; color: #555; margin-top: -5px; margin-bottom: 10px;}
-.output-header { margin-top: 20px; }
-"""
-speaker_choices = ["Achird", "Zubenelgenubi", "Vindemiatrix", "Sadachbia", "Sadaltager", "Sulafat", "Laomedeia", "Achernar", "Alnilam", "Schedar", "Gacrux", "Pulcherrima", "Umbriel", "Algieba", "Despina", "Erinome", "Algenib", "Rasalthgeti", "Orus", "Aoede", "Callirrhoe", "Autonoe", "Enceladus", "Iapetus", "Zephyr", "Puck", "Charon", "Kore", "Fenrir", "Leda"]
-# Using model names EXACTLY from the user's FIRST Colab code block:
-# #@param ["gemini-2.5-flash-preview-tts", "gemini-2.5-pro-preview-tts"]
-model_choices = ["gemini-2.5-flash-preview-tts", "gemini-2.5-pro-preview-tts"] # <<<< THIS IS NOW CORRECTED TO "2.5"
-selected_model_default = model_choices[0]
-aigolden_logo_encoded = "Q3JlYXRlIGJ5IDogYWlnb2xkZW4="
-try: aigolden_logo_decoded = base64.b64decode(aigolden_logo_encoded.encode()).decode()
-except: aigolden_logo_decoded = "Created by: aigolden"
-with gr.Blocks(css=css, theme=gr.themes.Soft(primary_hue="green", secondary_hue="lime")) as demo:
-    gr.Markdown(f"<h1>تبدیل متن به گفتار با Gemini گوگل</h1>")
-    gr.Markdown(f"<p style='text-align: center; color: gray; margin-bottom: 20px;'>{aigolden_logo_decoded}</p>")
-    with gr.Accordion("⚠️ راهنما و نکات مهم", open=False):
-        gr.Markdown("- **کلید API:** کلید API خود از Google AI Studio را در بخش `Settings` -> `Secrets` این Space با نام `GEMINI_API_KEY` (یا `GOOGLE_API_KEY`) ذخیره کنید.")
-        gr.Markdown("- **مدل‌ها:** مطمئن شوید مدل‌های انتخابی (`gemini-X.X-...-tts`) برای حساب شما فعال و قابل دسترس هستند.")
-        gr.Markdown("- **محدودیت‌ها:** API گوگل ممکن است محدودیت درخواست (quota) داشته باشد. در صورت خطا، صبر کرده و دوباره تلاش کنید، یا فاصله زمانی بین درخواست‌ها را افزایش دهید.")
-        gr.Markdown("- **فایل‌های حجیم:** پردازش متن‌های بسیار طولانی ممکن است زمان‌بر باشد و به محدودیت‌های منابع در Spaces برخورد کند.")
-        gr.Markdown("- **پاکسازی:** فایل‌های قدیمی با نام مشابه قبل از هر اجرای جدید پاک می‌شوند.")
-    with gr.Row():
-        with gr.Column(scale=3):
-            gr.Markdown("### ⚙️ تنظیمات اصلی")
-            use_file_input_cb = gr.Checkbox(label="استفاده از فایل متنی ورودی (.txt)", value=False)
-            gr.Markdown("اگر فعال شود، متن از فایل آپلود شده خوانده می‌شود.", elem_classes="small-info")
-            text_file_upload = gr.File(label="آپلود فایل متنی (.txt)", file_types=[".txt"], visible=False)
-            text_to_speak_input = gr.Textbox(lines=7, label="متن برای تبدیل به گفتار", placeholder="متن خود را اینجا وارد کنید...", visible=True)
-            def toggle_input_method(use_file):
-                return {text_file_upload: gr.update(visible=use_file), text_to_speak_input: gr.update(visible=not use_file)}
-            use_file_input_cb.change(toggle_input_method, inputs=use_file_input_cb, outputs=[text_file_upload, text_to_speak_input])
-            speech_prompt_input = gr.Textbox(label="پرامپت راهنمای سبک گفتار (اختیاری)", placeholder="مثال: از زبان یک یوتوبر پر انرژی و حرفه ای")
-            gr.Markdown("این پرامپت به تنظیم سبک و لحن گفتار کمک می‌کند.", elem_classes="small-info")
-            output_filename_base_input = gr.Textbox(label="نام پایه فایل خروجی (بدون پسوند)", value="gemini_tts_output")
-            gr.Markdown("برای نامگذاری فایل‌های صوتی تولید شده استفاده می‌شود.", elem_classes="small-info")
-        with gr.Column(scale=2):
-            gr.Markdown("### 🗣️ تنظیمات مدل و گوینده")
-            model_name_dd = gr.Dropdown(model_choices, label="انتخاب مدل Gemini TTS", value=selected_model_default)
-            gr.Markdown("مطمئن شوید این مدل‌ها برای TTS بهینه شده و برای شما فعال هستند.", elem_classes="small-info")
-            speaker_voice_dd = gr.Dropdown(speaker_choices, label="انتخاب گوینده", value="Charon")
-            gr.Markdown("گوینده مورد نظر را برای تولید صدا انتخاب کنید.", elem_classes="small-info")
-            temperature_slider = gr.Slider(minimum=0.0, maximum=1.0, step=0.05, value=0.7, label="دمای مدل (Temperature)")
-            gr.Markdown("مقادیر بالاتر = خلاقیت بیشتر، مقادیر پایین‌تر = قابل پیش‌بینی‌تر.", elem_classes="small-info")
-            gr.Markdown("### ✂️ تقسیم‌بندی و خروجی")
-            max_chunk_size_slider = gr.Slider(minimum=1000, maximum=4000, step=100, value=3800, label="حداکثر کاراکتر در هر قطعه")
-            gr.Markdown("متن‌های طولانی به قطعات کوچکتر تقسیم می‌شوند.", elem_classes="small-info")
-            sleep_between_requests_slider = gr.Slider(minimum=1, maximum=30, step=0.5, value=10, label="فاصله زمانی بین درخواست‌ها (ثانیه)")
-            gr.Markdown("برای جلوگیری از خطاهای محدودیت API (quota errors).", elem_classes="small-info")
-            merge_audio_files_cb = gr.Checkbox(label="ادغام فایل‌های صوتی جزئی", value=True)
-            gr.Markdown("ادغام فایل‌های صوتی بخش‌های مختلف متن طولانی در یک فایل WAV.", elem_classes="small-info")
-            delete_partial_files_cb = gr.Checkbox(label="حذف فایل‌های جزئی پس از ادغام", value=True)
-            gr.Markdown("فقط در صورتی اعمال می‌شود که ادغام فایل‌ها فعال و موفق باشد.", elem_classes="small-info")
-    submit_button = gr.Button("🎧 تبدیل متن به گفتار 🎧", variant="primary", scale=1)
-    gr.Markdown("### 🔊 خروجی و گزارش", elem_classes="output-header")
-    with gr.Row():
-        audio_output = gr.Audio(label="فایل صوتی نهایی", type="filepath", visible=False)
-        file_download_output = gr.File(label="دانلود فایل (ادغام شده یا ZIP)", type="filepath", visible=False)
-    status_output = gr.Textbox(label="وضعیت و گزارش‌ها", lines=10, interactive=False, show_copy_button=True)
-    submit_button.click(
-        generate_audio_gradio,
         inputs=[
-            use_file_input_cb, text_file_upload, text_to_speak_input, speech_prompt_input,
-            speaker_voice_dd, output_filename_base_input, model_name_dd, temperature_slider,
-            max_chunk_size_slider, sleep_between_requests_slider, merge_audio_files_cb, delete_partial_files_cb
         ],
-        outputs=[audio_output, file_download_output, status_output]
     )
 if __name__ == "__main__":
-    if not os.path.exists("outputs"): os.makedirs("outputs")
-    demo.launch(debug=True)

+import gradio as gr
 import base64
 import mimetypes
 import os
 import struct
 import time
 import zipfile
 from google import genai
 from google.genai import types
 try:
     from pydub import AudioSegment
     PYDUB_AVAILABLE = True
 except ImportError:
     PYDUB_AVAILABLE = False
+# --- Constants ---
# Prebuilt voice names offered in the speaker dropdown. Each entry is passed
# verbatim as ``voice_name`` to ``types.PrebuiltVoiceConfig``, so the spelling
# must match the API's voice catalogue exactly ("Rasalgethi", not
# "Rasalthgeti").
SPEAKER_VOICES = [
    "Achird", "Zubenelgenubi", "Vindemiatrix", "Sadachbia", "Sadaltager",
    "Sulafat", "Laomedeia", "Achernar", "Alnilam", "Schedar", "Gacrux",
    "Pulcherrima", "Umbriel", "Algieba", "Despina", "Erinome", "Algenib",
    "Rasalgethi", "Orus", "Aoede", "Callirrhoe", "Autonoe", "Enceladus",
    "Iapetus", "Zephyr", "Puck", "Charon", "Kore", "Fenrir", "Leda",
]
# Model identifiers offered in the model dropdown.
MODEL_NAMES = ["gemini-2.5-flash-preview-tts", "gemini-2.5-pro-preview-tts"]
+# --- Helper functions (Adapted for Gradio logging) ---
def save_binary_file(file_name, data, log_messages_list):
    """Write ``data`` to ``file_name`` and report the outcome in the log list.

    Args:
        file_name: Destination path. If it contains a directory component
            that does not exist yet, the directory is created first.
        data: Bytes-like payload written in binary mode.
        log_messages_list: List that receives one status message (success or
            failure); it is mutated in place.

    Returns:
        ``file_name`` on success, ``None`` if the file could not be written.
    """
    try:
        # A path such as "outputs/part001.wav" must not fail merely because
        # the target directory has not been created yet.
        parent_dir = os.path.dirname(file_name)
        if parent_dir:
            os.makedirs(parent_dir, exist_ok=True)
        with open(file_name, "wb") as f:
            f.write(data)
    except Exception as e:
        # Best-effort boundary: every failure is surfaced through the UI log
        # instead of propagating to the caller.
        log_messages_list.append(f"❌ خطا در ذخیره فایل {file_name}: {e}")
        return None
    log_messages_list.append(f"✅ فایل در مسیر زیر ذخیره شد: {file_name}")
    return file_name
 def convert_to_wav(audio_data: bytes, mime_type: str) -> bytes:
     parameters = parse_audio_mime_type(mime_type)
     block_align = num_channels * bytes_per_sample
     byte_rate = sample_rate * block_align
     chunk_size = 36 + data_size
     header = struct.pack(
         "<4sI4s4sIHHIIHH4sI",
         b"RIFF", chunk_size, b"WAVE", b"fmt ", 16, 1, num_channels,
 def parse_audio_mime_type(mime_type: str) -> dict[str, int | None]:
     bits_per_sample = 16
+    rate = 24000
     parts = mime_type.split(";")
     for param in parts:
         param = param.strip()
             try:
                 rate_str = param.split("=", 1)[1]
                 rate = int(rate_str)
+            except (ValueError, IndexError):
+                pass
+        elif param.startswith("audio/L"):
             try:
+                bits_per_sample = int(param.split("L", 1)[1])
+            except (ValueError, IndexError):
                 pass
     return {"bits_per_sample": bits_per_sample, "rate": rate}
 def smart_text_split(text, max_size=3800):
+    if len(text) <= max_size:
+        return [text]
     chunks = []
     current_chunk = ""
+    sentences = re.split(r'(?<=[.!?])\s+', text)
     for sentence in sentences:
+        if len(current_chunk) + len(sentence) + 1 > max_size:
             if current_chunk:
                 chunks.append(current_chunk.strip())
+            current_chunk = sentence
+            # If a single sentence is too long, split it by words/chars
+            if len(current_chunk) > max_size:
+                words = current_chunk.split()
+                temp_word_chunk = ""
+                for word in words:
+                    if len(temp_word_chunk) + len(word) + 1 > max_size:
+                        if temp_word_chunk: chunks.append(temp_word_chunk.strip())
+                        temp_word_chunk = word
+                        while len(temp_word_chunk) > max_size: # Force split very long words
+                            chunks.append(temp_word_chunk[:max_size])
+                            temp_word_chunk = temp_word_chunk[max_size:]
+                    else:
+                        temp_word_chunk += (" " if temp_word_chunk else "") + word
+                if temp_word_chunk: chunks.append(temp_word_chunk.strip())
+                current_chunk = "" # Reset current_chunk as it was processed
         else:
+            current_chunk += (" " if current_chunk else "") + sentence
+    if current_chunk:
         chunks.append(current_chunk.strip())
+    return [c for c in chunks if c] # Ensure no empty chunks
def merge_audio_files_func(file_paths, output_path, log_messages_list):
    """Concatenate audio files into a single WAV file at ``output_path``.

    Files are appended in the given order with 100 ms of silence between
    consecutive merged segments. Paths that do not exist are logged and
    skipped.

    Args:
        file_paths: Paths of the audio files to merge, in playback order.
        output_path: Destination path of the merged WAV file.
        log_messages_list: List that receives progress and error messages; it
            is mutated in place.

    Returns:
        ``True`` if at least one file was merged and the result was exported,
        ``False`` if pydub is unavailable, no input file could be used, or any
        error occurred while reading or exporting.
    """
    if not PYDUB_AVAILABLE:
        log_messages_list.append("❌ pydub در دسترس نیست. نمی‌توان فایل‌ها را ادغام کرد.")
        return False
    try:
        log_messages_list.append(f"🔗 در حال ادغام {len(file_paths)} فایل صوتی...")
        combined = AudioSegment.empty()
        merged_count = 0
        for i, file_path in enumerate(file_paths):
            if not os.path.exists(file_path):
                log_messages_list.append(f"⚠️ فایل پیدا نشد: {file_path}")
                continue
            log_messages_list.append(f"📎 اضافه کردن فایل {i+1}: {file_path}")
            segment = AudioSegment.from_file(file_path)
            # Insert the gap before every segment except the first merged one,
            # so a missing trailing file never leaves dangling silence.
            if merged_count:
                combined += AudioSegment.silent(duration=100)  # 100ms silence
            combined += segment
            merged_count += 1
        if merged_count == 0:
            # Do not export an empty WAV and report it as a successful merge.
            log_messages_list.append("❌ هیچ فایل معتبری برای ادغام پیدا نشد.")
            return False
        combined.export(output_path, format="wav")
        log_messages_list.append(f"✅ فایل ادغام شده ذخیره شد: {output_path}")
        return True
    except Exception as e:
        # Best-effort boundary: decoding/export failures are reported via the log.
        log_messages_list.append(f"❌ خطا در ادغام فایل‌ها: {e}")
        return False
def create_zip_file(file_paths, zip_name, log_messages_list):
    """Bundle the existing files from ``file_paths`` into a ZIP archive.

    Each file is stored under its base name (directory components are
    dropped). Paths that do not exist are logged and skipped.

    Args:
        file_paths: Paths of the files to add to the archive.
        zip_name: Destination path of the ZIP archive.
        log_messages_list: List that receives progress and error messages; it
            is mutated in place.

    Returns:
        ``True`` if an archive containing at least one file was written,
        ``False`` if no input file exists or an error occurred.
    """
    try:
        existing_files = []
        for file_path in file_paths:
            if os.path.exists(file_path):
                existing_files.append(file_path)
            else:
                log_messages_list.append(f"⚠️ فایل پیدا نشد: {file_path}")
        if not existing_files:
            # An empty archive would be reported as a successful download.
            log_messages_list.append("❌ هیچ فایلی برای افزودن به فایل ZIP پیدا نشد.")
            return False
        with zipfile.ZipFile(zip_name, 'w') as zipf:
            for file_path in existing_files:
                zipf.write(file_path, os.path.basename(file_path))
        log_messages_list.append(f"📦 فایل ZIP ایجاد شد: {zip_name}")
        return True
    except Exception as e:
        # Best-effort boundary: archive failures are reported via the log.
        log_messages_list.append(f"❌ خطا در ایجاد فایل ZIP: {e}")
        return False
+# --- Main generation function (Adapted for Gradio) ---
+def core_generate_audio(
+    text_input, prompt_input, selected_voice, output_base_name,
+    model, temperature_val,
+    max_chunk, sleep_time, merge_files, delete_partials,
+    log_messages_list  # Pass the list to append logs
 ):
+    log_messages_list.append("🚀 شروع فرآیند تبدیل متن به گفتار...")
+    # API Key Retrieval
+    api_key = os.environ.get("GEMINI_API_KEY")
+    if not api_key:
+        log_messages_list.append("❌ خطا: کلید API جمینای (GEMINI_API_KEY) در Secrets این Space تنظیم نشده است.")
+        log_messages_list.append("لطفاً به تنظیمات Space رفته و یک Secret با نام GEMINI_API_KEY و مقدار کلید خود ایجاد کنید.")
+        return None, None # No audio path, no download path
+    # Initialize GenAI Client
     try:
+        log_messages_list.append("🛠️ در حال ایجاد کلاینت جمینای...")
+        # os.environ["GEMINI_API_KEY"] = api_key # Already set if from secrets
+        client = genai.Client(api_key=api_key) # Pass api_key directly
+        log_messages_list.append("✅ کلاینت جمینای با موفقیت ایجاد شد.")
     except Exception as e:
+        log_messages_list.append(f"❌ خطا در ایجاد کلاینت جمینای: {e}")
+        log_messages_list.append("لطفاً از صحت کلید API خود اطمینان حاصل کنید.")
+        return None, None
+    # Validate Text Input (already done in wrapper, but good to double check)
+    if not text_input or text_input.strip() == "":
+        log_messages_list.append("❌ خطا: متن ورودی برای تبدیل به گفتار خالی است.")
+        return None, None
+    # Split text into chunks
+    text_chunks = smart_text_split(text_input, max_chunk)
+    log_messages_list.append(f"📊 متن به {len(text_chunks)} قطعه تقسیم شد.")
+    for i, chunk in enumerate(text_chunks):
+        log_messages_list.append(f"📝 قطعه {i+1}: {len(chunk)} کاراکتر")
+        if len(chunk) == 0: # Safety check from smart_text_split
+            log_messages_list.append(f"⚠️ هشدار: قطعه {i+1} خالی است و نادیده گرفته می‌شود.")
+    text_chunks = [c for c in text_chunks if c] # Filter out empty chunks again
+    if not text_chunks:
+        log_messages_list.append("❌ خطا: پس از تقسیم‌بندی، هیچ قطعه متنی برای پردازش وجود ندارد.")
+        return None, None
+    generated_files = []
+    # Ensure output directory exists (optional, can write to current dir)
+    # output_dir = "outputs"
+    # os.makedirs(output_dir, exist_ok=True)
+    for i, chunk in enumerate(text_chunks):
+        log_messages_list.append(f"\n🔊 تولید صدا برای قطعه {i+1}/{len(text_chunks)}...")
+        final_text = f'"{prompt_input}"\n{chunk}' if prompt_input and prompt_input.strip() else chunk
+        contents = [types.Content(role="user", parts=[types.Part.from_text(text=final_text)])]
+        generate_content_config = types.GenerateContentConfig(
+            temperature=temperature_val,
+            response_modalities=["audio"],
+            speech_config=types.SpeechConfig(
+                voice_config=types.VoiceConfig(
+                    prebuilt_voice_config=types.PrebuiltVoiceConfig(voice_name=selected_voice)
+                )
+            ),
+        )
+        current_chunk_filename_base = f"{output_base_name}_part{i+1:03d}"
+        # current_chunk_filename_base = os.path.join(output_dir, f"{output_base_name}_part{i+1:03d}")
         try:
+            # Using generate_content, not stream, for simplicity with single audio part expected
+            response = client.models.generate_content(
+                model=model,
+                contents=contents,
+                config=generate_content_config,
             )
+            if (response.candidates and response.candidates[0].content and
+                response.candidates[0].content.parts and
+                response.candidates[0].content.parts[0].inline_data):
+                inline_data = response.candidates[0].content.parts[0].inline_data
+                data_buffer = inline_data.data
+                file_extension = mimetypes.guess_extension(inline_data.mime_type)
+                if file_extension is None or "binary" in inline_data.mime_type: # Fallback for generic mime types
+                    file_extension = ".wav"
+                    # Assuming Gemini TTS API now more consistently returns audio/* mimetypes
+                    # but if it's audio/L16; rate=24000, convert_to_wav is needed
+                    if "audio/L" in inline_data.mime_type: # Needs WAV header
+                         data_buffer = convert_to_wav(data_buffer, inline_data.mime_type)
+                    # If it's already audio/wav or audio/mpeg, it might be fine.
+                    # Forcing .wav for consistency as pydub handles WAV well.
+                    # If Gemini sends actual WAV, convert_to_wav might not be strictly needed
+                    # but better safe than sorry if mime is generic.
+                generated_file_path = save_binary_file(f"{current_chunk_filename_base}{file_extension}", data_buffer, log_messages_list)
+                if generated_file_path:
+                    generated_files.append(generated_file_path)
+                    log_messages_list.append(f"✅ قطعه {i+1} تولید شد: {generated_file_path}")
+            elif response.text: # If API returns text (e.g. error or info)
+                 log_messages_list.append(f"ℹ️ پیام متنی از API برای قطعه {i+1}: {response.text}")
+                 if "rate limit" in response.text.lower():
+                    log_messages_list.append(f"⏳ به نظر میرسد به محدودیت تعداد درخواست API رسیده‌اید. لطفاً چند دقیقه صبر کنید و دوباره امتحان کنید، یا فاصله زمانی بین درخواست‌ها را افزایش دهید.")
+            else: # No audio, no text
+                log_messages_list.append(f"⚠️ پاسخ API برای قطعه {i+1} حاوی داده صوتی یا پیام متنی نبود.")
+        except types.generation_types.BlockedPromptException as bpe:
+            log_messages_list.append(f"❌ محتوای پرامپت برای قطعه {i+1} مسدود شد: {bpe}")
+            log_messages_list.append("لطفاً متن ورودی یا پرامپت سبک گفتار را بررسی و اصلاح کنید.")
+            continue # Skip to next chunk
+        except types.generation_types.StopCandidateException as sce:
+            log_messages_list.append(f"❌ تولید محتوا برای قطعه {i+1} به دلیل نامشخصی متوقف شد: {sce}")
+            continue
         except Exception as e:
+            log_messages_list.append(f"❌ خطا در تولید قطعه {i+1}: {e}")
+            # Specific check for common API errors
+            if "API key not valid" in str(e):
+                log_messages_list.append("خطای کلید API. لطفاً از معتبر بودن کلید و تنظیم صحیح آن در Secrets مطمئن شوید.")
+            elif "resource has been exhausted" in str(e).lower() or "quota" in str(e).lower():
+                 log_messages_list.append("به نظر میرسد محدودیت استفاده از API (Quota) شما تمام شده است.")
+            continue # Skip to next chunk
+        if i < len(text_chunks) - 1 and len(text_chunks) > 1 : # Only sleep if there are more chunks
+            log_messages_list.append(f"⏱️ انتظار {sleep_time} ثانیه...")
+            time.sleep(sleep_time)
     if not generated_files:
+        log_messages_list.append("❌ هیچ فایل صوتی تولید نشد!")
+        return None, None
+    log_messages_list.append(f"\n🎉 {len(generated_files)} فایل صوتی با موفقیت تولید شد!")
+    playback_file = None
+    download_file = None
+    if merge_files and len(generated_files) > 1:
+        if not PYDUB_AVAILABLE:
+            log_messages_list.append("⚠️ pydub برای ادغام در دسترس نیست. فایل‌ها به صورت جداگانه ارائه می‌شوند.")
+            # Offer zip of parts if pydub not available for merging
+            zip_filename = f"{output_base_name}_all_parts.zip"
+            if create_zip_file(generated_files, zip_filename, log_messages_list):
+                download_file = zip_filename
+            playback_file = generated_files[0] # Play first part
+        else:
+            merged_filename = f"{output_base_name}_merged.wav"
+            # merged_filename = os.path.join(output_dir, f"{output_base_name}_merged.wav")
+            if merge_audio_files_func(generated_files, merged_filename, log_messages_list):
+                playback_file = merged_filename
+                download_file = merged_filename
+                log_messages_list.append(f"🎵 فایل نهایی ادغام شده: {merged_filename}")
+                if delete_partials:
+                    for file_path in generated_files:
+                        try:
+                            if file_path != merged_filename: # Don't delete the merged file itself if it was in generated_files
+                                os.remove(file_path)
+                                log_messages_list.append(f"🗑️ فایل جزئی حذف شد: {file_path}")
+                        except Exception as e:
+                            log_messages_list.append(f"⚠️ خطا در حذف فایل جزئی {file_path}: {e}")
+            else:
+                log_messages_list.append("⚠️ ادغام ممکن نبود. فایل‌های جداگانه حفظ شدند.")
+                # Fallback to zip if merging failed
+                zip_filename = f"{output_base_name}_all_parts.zip"
+                # zip_filename = os.path.join(output_dir, f"{output_base_name}_all_parts.zip")
+                if create_zip_file(generated_files, zip_filename, log_messages_list):
+                    download_file = zip_filename
+                playback_file = generated_files[0] # Play first part
     elif len(generated_files) == 1:
+        playback_file = generated_files[0]
+        download_file = generated_files[0]
+    else: # Multiple files, no merge requested
+        zip_filename = f"{output_base_name}_all_parts.zip"
+        # zip_filename = os.path.join(output_dir, f"{output_base_name}_all_parts.zip")
+        if create_zip_file(generated_files, zip_filename, log_messages_list):
+            download_file = zip_filename
+        playback_file = generated_files[0] # Play first part
+    if playback_file and not os.path.exists(playback_file):
+        log_messages_list.append(f"⚠️ فایل پخش {playback_file} وجود ندارد!")
+        playback_file = None
+    if download_file and not os.path.exists(download_file):
+        log_messages_list.append(f"⚠️ فایل دانلود {download_file} وجود ندارد!")
+        download_file = None
+    return playback_file, download_file
+# --- Gradio Interface Function ---
+def gradio_tts_interface(
+    use_file_input, uploaded_file, text_to_speak,
+    speech_prompt, speaker_voice, output_filename_base,
+    model_name, temperature,
+    max_chunk_size, sleep_between_requests,
+    merge_audio_files, delete_partial_files,
+    progress=gr.Progress(track_tqdm=True)
+):
+    log_messages = [] # Initialize list for logs for this run
+    # Determine actual text input
+    actual_text_input = ""
+    if use_file_input:
+        if uploaded_file is not None:
+            try:
+                with open(uploaded_file.name, 'r', encoding='utf-8') as f:
+                    actual_text_input = f.read().strip()
+                log_messages.append(f"✅ متن از فایل '{os.path.basename(uploaded_file.name)}' بارگذاری شد: {len(actual_text_input)} کاراکتر.")
+                log_messages.append(f"📝 نمونه متن فایل: '{actual_text_input[:100]}{'...' if len(actual_text_input) > 100 else ''}'")
+                if not actual_text_input:
+                    log_messages.append("❌ خطا: فایل آپلود شده خالی است.")
+                    return None, None, "\n".join(log_messages)
+            except Exception as e:
+                log_messages.append(f"❌ خطا در خواندن فایل آپلود شده: {e}")
+                return None, None, "\n".join(log_messages)
+        else:
+            log_messages.append("❌ خطا: گزینه 'استفاده از فایل ورودی' انتخاب شده اما هیچ فایلی آپلود نشده است.")
+            return None, None, "\n".join(log_messages)
+    else:
+        actual_text_input = text_to_speak
+        if not actual_text_input or not actual_text_input.strip():
+            log_messages.append("❌ خطا: متن ورودی برای تبدیل به گفتار خالی است. لطفاً متنی را وارد کنید یا گزینه فایل را فعال کنید.")
+            return None, None, "\n".join(log_messages)
+        log_messages.append(f"📖 متن ورودی دستی: {len(actual_text_input)} کاراکتر")
+        log_messages.append(f"📝 نمونه متن ورودی: '{actual_text_input[:100]}{'...' if len(actual_text_input) > 100 else ''}'")
+    if not PYDUB_AVAILABLE:
+        log_messages.append("⚠️ کتابخانه pydub در دسترس نیست. امکان ادغام فایل‌های صوتی وجود نخواهد داشت و فایل‌های صوتی به صورت جداگانه (در صورت وجود چند بخش) در یک فایل ZIP ارائه می‌شوند.")
+        merge_audio_files = False # Force disable merge if pydub is not available
+    # Call the core generation logic
+    playback_path, download_path = core_generate_audio(
+        actual_text_input,
+        speech_prompt,
+        speaker_voice,
+        output_filename_base if output_filename_base else "gemini_tts_output",
+        model_name,
+        temperature,
+        max_chunk_size,
+        sleep_between_requests,
+        merge_audio_files,
+        delete_partial_files,
+        log_messages # Pass the list
+    )
+    log_output = "\n".join(log_messages)
+    # Ensure paths are valid before returning
+    valid_playback_path = playback_path if playback_path and os.path.exists(playback_path) else None
+    valid_download_path = download_path if download_path and os.path.exists(download_path) else None
+    if not valid_playback_path and not valid_download_path and not actual_text_input:
+         # Avoid error message if it was just an empty input from the start
+        pass
+    elif not valid_playback_path and not valid_download_path :
+        log_output += "\n🛑 هیچ فایل صوتی برای پخش یا دانلود در دسترس نیست."
+    return valid_playback_path, valid_download_path, log_output
+# --- Gradio UI Definition: custom stylesheet passed to gr.Blocks(css=...) (page width, button colours, hidden footer/gallery views) ---
+css = """
+body { font-family: 'Arial', sans-serif; }
+.gradio-container { max-width: 800px !important; margin: auto !important; }
+footer { display: none !important; }
+.gr-button { background-color: #007bff !important; color: white !important; }
+.gr-button:hover { background-color: #0056b3 !important; }
+#output_audio .gallery { display: none !important; } /* Hide gallery view for audio if it appears */
+#download_file_output .gallery { display: none !important; } /* Hide gallery view for file if it appears */
+"""
+with gr.Blocks(css=css, theme=gr.themes.Soft()) as demo:
+    gr.Markdown("## 🔊 تبدیل متن به گفتار با Gemini API")
+    gr.Markdown("ساخته شده بر اساس کد کولب توسط: [aigolden](https://github.com/aigolden)") # Assuming aigolden is a GitHub user or similar
+    gr.Markdown("---")
+    gr.Markdown(
+        "**راهنما:** برای استفاده از این ابزار، ابتدا باید کلید API جمینای خود را در بخش **Secrets** این Space در Hugging Face اضافه کنید.\n"
+        "1. به صفحه Space خود بروید.\n"
+        "2. روی 'Settings' کلیک کنید.\n"
+        "3. در بخش 'Repository secrets'، روی 'New secret' کلیک کنید.\n"
+        "4. در فیلد 'Name'، عبارت `GEMINI_API_KEY` را وارد کنید.\n"
+        "5. در فیلد 'Value'، کلید API جمینای خود را وارد کنید و 'Save secret' را بزنید.\n"
+        "پس از تنظیم Secret، می‌توانید از این ابزار استفاده کنید."
+    )
+    gr.Markdown("---")
+    with gr.Row():
+        with gr.Column(scale=2):
+            gr.Markdown("###  تنظیمات ورودی و پرامپت")
+            use_file_input_cb = gr.Checkbox(label="📄 استفاده از فایل متنی ورودی", value=False)
+            # Conditional visibility for text_to_speak_tb vs uploaded_file_input
+            # Gradio handles this by just having both and user interaction defines which is used via the wrapper
+            uploaded_file_input = gr.File(label="📂 آپلود فایل متنی (فقط شامل متن اصلی)", file_types=['.txt'])
+            text_to_speak_tb = gr.Textbox(
+                label="📝 متن ورودی (اگر گزینه فایل فعال نیست)",
+                placeholder="متن مورد نظر برای تبدیل به گفتار را اینجا وارد کنید...",
+                lines=7,
+                value="سلام دنیا! این یک آزمایش برای تبدیل متن به گفتار با استفاده از مدل جمینای است."
+            )
+            speech_prompt_tb = gr.Textbox(
+                label="🗣️ پرامپت برای تنظیم سبک گفتار",
+                placeholder="مثال: از زبان یک یوتوبر پر انرژی و حرفه ای",
+                value="به زبان یک گوینده حرفه‌ای و آرام صحبت کن."
+            )
+        with gr.Column(scale=1):
+            gr.Markdown("### تنظیمات مدل و خروجی")
+            model_name_dd = gr.Dropdown(
+                MODEL_NAMES, label="🤖 انتخاب مدل", value="gemini-2.5-flash-preview-tts"
+            )
+            speaker_voice_dd = gr.Dropdown(
+                SPEAKER_VOICES, label="🎤 انتخاب گوینده", value="Charon"
+            )
+            temperature_slider = gr.Slider(
+                minimum=0, maximum=2, step=0.05, value=1.0, label="🌡️ دمای مدل (تنوع خروجی)"
+            )
+            output_filename_base_tb = gr.Textbox(
+                label="📛 نام پایه فایل خروجی (بدون پسوند)", value="gemini_tts_output"
+            )
+    gr.Markdown("---")
+    gr.Markdown("### تنظیمات پیشرفته")
+    with gr.Row():
+        max_chunk_size_slider = gr.Slider(
+            minimum=2000, maximum=4000, step=100, value=3800, label="📏 حداکثر کاراکتر در هر قطعه"
+        )
+        sleep_between_requests_slider = gr.Slider(
+            minimum=5, maximum=20, step=0.5, value=14, label="⏱️ فاصله زمانی بین درخواست‌ها (ثانیه)"
+        ) # Increased min sleep a bit
+    with gr.Row():
+        merge_audio_files_cb = gr.Checkbox(label="🔗 ادغام فایل‌های صوتی در یک فایل", value=True)
+        delete_partial_files_cb = gr.Checkbox(label="🗑️ حذف فایل‌های جزئی پس از ادغام (اگر ادغام فعال باشد)", value=False)
+    gr.Markdown("---")
+    generate_button = gr.Button("🎙️ تولید صدا", variant="primary")
+    gr.Markdown("---")
+    gr.Markdown("### 🎧 خروجی صوتی و دانلود 📥")
+    with gr.Row():
+        output_audio = gr.Audio(label="🔊 فایل صوتی تولید شده", elem_id="output_audio")
+        download_file_output = gr.File(label="💾 دانلود فایل نهایی (WAV یا ZIP)", elem_id="download_file_output")
+    gr.Markdown("### 📜 لاگ‌ها و پیام‌ها")
+    logs_output_tb = gr.Textbox(label=" ", lines=10, interactive=False, autoscroll=True)
+    # Connect button to function
+    generate_button.click(
+        fn=gradio_tts_interface,
+        inputs=[
+            use_file_input_cb, uploaded_file_input, text_to_speak_tb,
+            speech_prompt_tb, speaker_voice_dd, output_filename_base_tb,
+            model_name_dd, temperature_slider,
+            max_chunk_size_slider, sleep_between_requests_slider,
+            merge_audio_files_cb, delete_partial_files_cb
+        ],
+        outputs=[output_audio, download_file_output, logs_output_tb]
+    )
+    # Example texts
+    gr.Examples(
+        examples=[
+            [False, None, "سلام، این یک تست کوتاه است.", "یک صدای دوستانه و واضح.", "Charon", "gemini_tts_output", "gemini-2.5-flash-preview-tts", 0.9, 3800, 12, True, False],
+            [False, None, "به دنیای هوش مصنوعی خوش آمدید. امیدو��رم از این ابزار لذت ببرید.", "با هیجان و انرژی صحبت کن.", "Zephyr", "ai_voice_test", "gemini-2.5-flash-preview-tts", 1.1, 3000, 10, True, True],
+        ],
         inputs=[
+            use_file_input_cb, uploaded_file_input, text_to_speak_tb,
+            speech_prompt_tb, speaker_voice_dd, output_filename_base_tb,
+            model_name_dd, temperature_slider,
+            max_chunk_size_slider, sleep_between_requests_slider,
+            merge_audio_files_cb, delete_partial_files_cb
         ],
+        outputs=[output_audio, download_file_output, logs_output_tb], # outputs are optional for examples
+        fn=gradio_tts_interface, # function to call for examples
+        cache_examples=False # Set to True if you want to precompute and cache example outputs
     )
+    gr.Markdown(
+        "<div style='text-align: center; margin-top: 20px; font-size: 0.9em; color: grey;'>"
+        "این ابزار از API شرکت Google Gemini برای تبدیل متن به گفتار استفاده می‌کند. "
+        "لطفاً به محدودیت‌های استفاده و شرایط خدمات Gemini API توجه فرمایید."
+        "</div>"
+    )
 if __name__ == "__main__":
+    demo.launch(debug=True) # Start the Gradio app only when run as a script; debug=True is meant for local testing