Spaces:

Hamed744
/

Ttspro

Running

App Files Files Community

Hamed744 committed on Jun 5

Commit

3b52ce7

verified ·

1 Parent(s): 47095d4

Update app.py

Browse files

Files changed (1) hide show

app.py +507 -248

app.py CHANGED Viewed

@@ -1,25 +1,75 @@
 import gradio as gr
-import base64
-import mimetypes
 import os
-import re
-import struct
 import time
-import zipfile
-from google import genai
-from google.genai import types
 import logging
-logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(levelname)s - %(message)s')
 try:
     from pydub import AudioSegment
     PYDUB_AVAILABLE = True
-    logging.info("pydub با موفقیت ایمپورت شد.")
 except ImportError:
     PYDUB_AVAILABLE = False
-    logging.warning("pydub یافت نشد. قابلیت ادغام فایل‌های صوتی غیرفعال خواهد بود.")
 SPEAKER_VOICES = [
     "Achird", "Zubenelgenubi", "Vindemiatrix", "Sadachbia", "Sadaltager",
     "Sulafat", "Laomedeia", "Achernar", "Alnilam", "Schedar", "Gacrux",
@@ -27,22 +77,22 @@ SPEAKER_VOICES = [
     "Rasalthgeti", "Orus", "Aoede", "Callirrhoe", "Autonoe", "Enceladus",
     "Iapetus", "Zephyr", "Puck", "Charon", "Kore", "Fenrir", "Leda"
 ]
-FIXED_MODEL_NAME = "gemini-2.5-flash-preview-tts"
 DEFAULT_MAX_CHUNK_SIZE = 3800
-DEFAULT_SLEEP_BETWEEN_REQUESTS = 7
-DEFAULT_OUTPUT_FILENAME_BASE = "alpha_tts_audio_gtts"
-def _log_internal(message, log_list_ref):
     log_list_ref.append(message)
-    logging.info(f"[CORE_LOG] {message}")
 def save_binary_file(file_name, data, log_list_ref):
     try:
         with open(file_name, "wb") as f: f.write(data)
-        _log_internal(f"فایل ذخیره شد: {os.path.basename(file_name)}", log_list_ref)
         return file_name
     except Exception as e:
-        _log_internal(f"خطا در ذخیره فایل {os.path.basename(file_name)}: {e}", log_list_ref)
         return None
 def convert_to_wav(audio_data: bytes, mime_type: str) -> bytes:
@@ -69,276 +119,485 @@ def parse_audio_mime_type(mime_type: str) -> dict[str, int]:
 def smart_text_split(text, max_size=3800, log_list_ref=None):
     if len(text) <= max_size: return [text]
     chunks, current_chunk = [], ""
-    sentences = re.split(r'(?<=[.!?؟])\s+', text)
     for sentence in sentences:
         if len(current_chunk) + len(sentence) + 1 > max_size:
             if current_chunk: chunks.append(current_chunk.strip())
             current_chunk = sentence
             while len(current_chunk) > max_size:
-                split_idx = next((i for i in range(max_size - 1, max_size // 2, -1) if current_chunk[i] in ['،', ',', ';', ':', ' ']), -1)
-                part, current_chunk = (current_chunk[:split_idx+1], current_chunk[split_idx+1:]) if split_idx != -1 else (current_chunk[:max_size], current_chunk[max_size:])
                 chunks.append(part.strip())
-        else: current_chunk += (" " if current_chunk else "") + sentence
     if current_chunk: chunks.append(current_chunk.strip())
     final_chunks = [c for c in chunks if c]
-    if log_list_ref: _log_internal(f"متن به {len(final_chunks)} قطعه تقسیم شد.", log_list_ref)
     return final_chunks
 def merge_audio_files_func(file_paths, output_path, log_list_ref):
-    if not PYDUB_AVAILABLE: _log_internal("pydub در دسترس نیست، ادغام انجام نشد.", log_list_ref); return False
     try:
-        _log_internal(f"ادغام {len(file_paths)} فایل صوتی...", log_list_ref)
         combined = AudioSegment.empty()
         for i, fp in enumerate(file_paths):
-            if os.path.exists(fp): combined += AudioSegment.from_file(fp) + (AudioSegment.silent(duration=150) if i < len(file_paths) - 1 else AudioSegment.empty())
-            else: _log_internal(f"فایل پیدا نشد برای ادغام: {fp}", log_list_ref)
         combined.export(output_path, format="wav")
-        _log_internal(f"فایل با موفقیت در {os.path.basename(output_path)} ادغام شد.", log_list_ref); return True
-    except Exception as e: _log_internal(f"خطا در ادغام فایل‌ها: {e}", log_list_ref); return False
 def core_generate_audio(text_input, prompt_input, selected_voice, temperature_val, log_list_ref):
     output_base_name = DEFAULT_OUTPUT_FILENAME_BASE
     max_chunk, sleep_time = DEFAULT_MAX_CHUNK_SIZE, DEFAULT_SLEEP_BETWEEN_REQUESTS
-    _log_internal("شروع فرآیند تولید صدا...", log_list_ref)
-    api_key = os.environ.get("GEMINI_API_KEY_1")
-    if not api_key: api_key = os.environ.get("GEMINI_API_KEY")
-    if not api_key:
-        _log_internal("خطای حیاتی: هیچ Secret با نام GEMINI_API_KEY_1 یا GEMINI_API_KEY یافت نشد!", log_list_ref)
-        return None
-    _log_internal(f"استفاده از کلید API جمینای (...{api_key[-4:] if api_key else 'N/A'})", log_list_ref)
-    try: client = genai.Client(api_key=api_key)
-    except Exception as e: _log_internal(f"خطا در ایجاد کلاینت جمینای: {e}", log_list_ref); return None
-    if not text_input or not text_input.strip(): _log_internal("متن ورودی خالی است.", log_list_ref); return None
     text_chunks = smart_text_split(text_input, max_chunk, log_list_ref)
-    if not text_chunks: _log_internal("پس از تقسیم‌بندی، متنی برای پردازش وجود ندارد.", log_list_ref); return None
-    generated_files_temp = []
     for i, chunk in enumerate(text_chunks):
-        _log_internal(f"پردازش قطعه {i+1} از {len(text_chunks)}...", log_list_ref)
-        final_text = f'"{prompt_input}"\n{chunk}' if prompt_input and prompt_input.strip() else chunk
-        contents = [types.Content(role="user", parts=[types.Part.from_text(text=final_text)])]
-        config = types.GenerateContentConfig(temperature=temperature_val, response_modalities=["audio"],
-            speech_config=types.SpeechConfig(voice_config=types.VoiceConfig(
-                prebuilt_voice_config=types.PrebuiltVoiceConfig(voice_name=selected_voice))))
-        timestamp = int(time.time() * 1000)
-        temp_fname_base = f"temp_audio_{timestamp}_part{i+1:03d}"
         try:
-            response = client.models.generate_content(model=FIXED_MODEL_NAME, contents=contents, config=config)
-            if response.candidates and response.candidates[0].content and response.candidates[0].content.parts and response.candidates[0].content.parts[0].inline_data:
-                inline_data = response.candidates[0].content.parts[0].inline_data
-                data_buffer = inline_data.data
-                ext = mimetypes.guess_extension(inline_data.mime_type) or ".wav"
-                if "audio/L" in inline_data.mime_type and ext == ".wav": data_buffer = convert_to_wav(data_buffer, inline_data.mime_type)
-                if not ext.startswith("."): ext = "." + ext
-                temp_fpath = save_binary_file(f"{temp_fname_base}{ext}", data_buffer, log_list_ref)
-                if temp_fpath: generated_files_temp.append(temp_fpath)
-            else: _log_internal(f"پاسخ API برای قطعه {i+1} بدون داده صوتی معتبر.", log_list_ref)
-        except Exception as e:
-            _log_internal(f"خطای بحرانی در تولید قطعه {i+1} با جمینای: {e}\n{traceback.format_exc()}", log_list_ref);
-            for fp_clean in generated_files_temp:
-                if os.path.exists(fp_clean):
-                    try: os.remove(fp_clean)
-                    except: _log_internal(f"خطا در پاک کردن فایل موقت {fp_clean} پس از خطا", log_list_ref)
-            return None
-        if i < len(text_chunks) - 1 and len(text_chunks) > 1: time.sleep(sleep_time)
-    if not generated_files_temp: _log_internal("هیچ فایل صوتی موقتی تولید نشد.", log_list_ref); return None
-    _log_internal(f"{len(generated_files_temp)} قطعه صوتی با موفقیت تولید شد.", log_list_ref)
-    final_output_path = f"{output_base_name}_final.wav"
-    if os.path.exists(final_output_path):
-        try: os.remove(final_output_path)
-        except Exception as e_del: _log_internal(f"خطا در حذف فایل خروجی قبلی {final_output_path}: {e_del}", log_list_ref)
-    final_audio_file_to_return = None
-    if len(generated_files_temp) > 1:
         if PYDUB_AVAILABLE:
-            if merge_audio_files_func(generated_files_temp, final_output_path, log_list_ref):
-                final_audio_file_to_return = final_output_path
-            else:
-                _log_internal("ادغام ناموفق بود.", log_list_ref)
-                final_audio_file_to_return = None
-        else:
-            _log_internal("pydub برای ادغام چند قطعه در دسترس نیست.", log_list_ref)
-            final_audio_file_to_return = None
-    elif len(generated_files_temp) == 1:
         try:
-            os.rename(generated_files_temp[0], final_output_path)
-            final_audio_file_to_return = final_output_path
-        except Exception as e_rename:
-            _log_internal(f"خطا در انتقال فایل تکی به مسیر نهایی: {e_rename}", log_list_ref)
-            final_audio_file_to_return = None
-            if os.path.exists(generated_files_temp[0]):
-                try: os.remove(generated_files_temp[0])
-                except: pass
-    # پاک کردن تمام فایل‌های موقت که در generated_files_temp لیست شده‌اند
-    # این حلقه باید در این سطح تورفتگی باشد
-    for temp_f in generated_files_temp:
-        if os.path.exists(temp_f) and (not final_audio_file_to_return or os.path.abspath(temp_f) != os.path.abspath(final_audio_file_to_return)):
-            try:
-                os.remove(temp_f)
-                _log_internal(f"فایل موقت {os.path.basename(temp_f)} پاک شد.", log_list_ref)
-            except Exception as e_clean:
-                _log_internal(f"خطا در پاک کردن فایل موقت {os.path.basename(temp_f)}: {e_clean}", log_list_ref)
-    if final_audio_file_to_return and not os.path.exists(final_audio_file_to_return):
-        _log_internal(f"فایل نهایی '{final_audio_file_to_return}' پس از پردازش وجود ندارد!", log_list_ref)
-        return None
-    return final_audio_file_to_return
-def gradio_tts_interface(use_file_input, uploaded_file, text_to_speak, speech_prompt, speaker_voice, temperature, progress=gr.Progress(track_tqdm=True)):
-    logs = []
     actual_text = ""
     if use_file_input:
-        if uploaded_file:
             try:
-                with open(uploaded_file.name, 'r', encoding='utf-8') as f: actual_text = f.read().strip()
-                if not actual_text: _log_internal("فایل آپلود شده خالی است.", logs); return None
-            except Exception as e: _log_internal(f"خطا در خواندن فایل آپلود شده: {e}", logs); return None
-        else: _log_internal("گزینه فایل انتخاب شده اما فایلی آپلود نشده.", logs); return None
     else:
         actual_text = text_to_speak
-        if not actual_text or not actual_text.strip(): _log_internal("متن ورودی برای تبدیل خالی است.", logs); return None
-    final_audio_path = core_generate_audio(actual_text, speech_prompt, speaker_voice, temperature, logs)
-    if final_audio_path:
-        logging.info(f"فایل صوتی نهایی برای ارسال به کاربر: {final_audio_path}")
-        return final_audio_path
-    else:
-        logging.warning("هیچ فایل صوتی نهایی برای ارسال به کاربر تولید نشد.")
-        return None
-APP_HEADER_GRADIENT_START = "#4F46E5"
-APP_HEADER_GRADIENT_END = "#10B981"
-PANEL_BACKGROUND = "#FFFFFF"
-TEXT_INPUT_BG = "#F3F4F6"
-BUTTON_BG = "#2979FF"
-MAIN_BACKGROUND = "linear-gradient(170deg, #E0F2FE 0%, #F3E8FF 100%)"
-TEXT_PRIMARY = "#1F2937"
-TEXT_SECONDARY = "#6B7280"
-BORDER_COLOR = "#D1D5DB"
-RADIUS_CARD = "20px"
-RADIUS_INPUT = "10px"
-SHADOW_CARD = "0 10px 30px -5px rgba(0,0,0,0.1)"
-SHADOW_BUTTON = f"0 4px 10px -2px rgba({int(BUTTON_BG[1:3],16)},{int(BUTTON_BG[3:5],16)},{int(BUTTON_BG[5:7],16)},0.5)"
-LABEL_TEXT_INPUT = "📝 متن فارسی برای تبدیل"
-LABEL_SPEECH_PROMPT = "🗣️ سبک گفتار (اختیاری)"
-LABEL_SPEAKER_VOICE = "🎤 انتخاب گوینده و لهجه"
-LABEL_TEMPERATURE = "🌡️ خلاقیت و تنوع صدا"
-LABEL_FILE_UPLOAD = "📄 استفاده از فایل متنی (.txt)"
-custom_css_final_attempt = f"""
-@import url('https://fonts.googleapis.com/css2?family=Vazirmatn:wght@300;400;500;700;800&display=swap');
 :root {{
-    --app-font: 'Vazirmatn', sans-serif;
-    --app-header-grad-start: {APP_HEADER_GRADIENT_START}; --app-header-grad-end: {APP_HEADER_GRADIENT_END};
-    --app-panel-bg: {PANEL_BACKGROUND}; --app-input-bg: {TEXT_INPUT_BG};
-    --app-button-bg: {BUTTON_BG}; --app-main-bg: {MAIN_BACKGROUND};
-    --app-text-primary: {TEXT_PRIMARY}; --app-text-secondary: {TEXT_SECONDARY};
-    --app-border-color: {BORDER_COLOR};
-    --radius-card: {RADIUS_CARD}; --radius-input: {RADIUS_INPUT};
-    --shadow-card: {SHADOW_CARD}; --shadow-button: {SHADOW_BUTTON};
-}}
-body, .gradio-container {{ font-family: var(--app-font); direction: rtl; background: var(--app-main-bg); color: var(--app-text-primary); font-size: 15px; line-height: 1.6; }}
-.gradio-container {{ max-width:100% !important; min-height:100vh; margin:0 !important; padding:0 !important; display:flex; flex-direction:column; }}
-.app-header-container {{ padding: 2.8rem 1.5rem 3.5rem 1.5rem; text-align: center; background-image: linear-gradient(135deg, var(--app-header-grad-start) 0%, var(--app-header-grad-end) 100%); color: white; border-bottom-left-radius: var(--radius-card); border-bottom-right-radius: var(--radius-card); box-shadow: 0 6px 20px -5px rgba(0,0,0,0.25); }}
-.app-header-container h1 {{ font-size: 2.3em; font-weight: 800; margin:0 0 0.4rem 0; text-shadow: 0 1px 3px rgba(0,0,0,0.2); }}
-.app-header-container p {{ font-size: 1.05em; color: rgba(255,255,255,0.9); margin-top:0; opacity: 0.95; }}
-.main-content-wrapper-alpha {{ padding: 1.8rem 1.5rem; max-width: 650px; margin: -2.5rem auto 2rem auto; width: 90%; background-color: var(--app-panel-bg); border-radius: var(--radius-card); box-shadow: var(--shadow-card); position:relative; z-index:10; }}
-@media (max-width: 768px) {{
-    .main-content-wrapper-alpha {{ width: 92%; padding: 1.5rem 1.2rem; margin-top: -2rem; }}
-    .app-header-container h1 {{font-size:2em;}}
-    .app-header-container p {{font-size:1em;}}
-}}
-footer {{display:none !important;}}
-.gradio-button.generate-button-final-alpha {{ background: var(--app-button-bg) !important; color: white !important; border:none !important; border-radius: var(--radius-input) !important; padding: 0.85rem 1.5rem !important; font-weight: 700 !important; font-size:1.05em !important; transition: all 0.25s ease; box-shadow: var(--shadow-button); width:100%; margin-top:1.8rem !important; }}
-.gradio-button.generate-button-final-alpha:hover {{ filter: brightness(1.15); transform: translateY(-2px); box-shadow: 0 6px 12px -3px rgba({int(BUTTON_BG[1:3],16)},{int(BUTTON_BG[3:5],16)},{int(BUTTON_BG[5:7],16)},0.65);}}
-.gradio-textbox > label + div > textarea,
-.gradio-dropdown > label + div > div > input,
-.gradio-dropdown select,
-.gradio-file > label + div {{
-    border-radius: var(--radius-input) !important;
-    border: 1px solid var(--app-border-color) !important;
-    background-color: var(--app-input-bg) !important;
-    box-shadow: inset 0 1px 3px rgba(0,0,0,0.06);
-    padding: 0.8rem !important;
-    font-size: 0.95em !important;
 }}
-.gradio-dropdown .wrap-inner {{ border-radius: var(--radius-input) !important; }}
-.gradio-file > label + div {{ text-align:center; border-style: dashed !important; padding: 1.2rem !important; }}
-.gradio-file span[data-testid="block-title"] {{ font-weight:500; color: var(--app-text-secondary); font-size:0.9em; }}
-.gradio-file button.svelte-116rqfv {{ background: var(--app-button-bg) !important; color:white !important; border-radius:6px !important; padding: 0.4rem 0.8rem !important; font-size:0.85em !important; }}
-.gradio-textbox > label + div > textarea:focus,
-.gradio-dropdown > label + div > div > input:focus {{
-    border-color: var(--app-button-bg) !important;
-    box-shadow: 0 0 0 3.5px rgba({int(BUTTON_BG[1:3],16)},{int(BUTTON_BG[3:5],16)},{int(BUTTON_BG[5:7],16)},0.25) !important;
 }}
-label.gradio-label > .label-text {{ font-weight: 500 !important; color: var(--app-text-primary) !important; font-size: 0.98em !important; margin-bottom: 0.6rem !important; display: block; }}
-.gradio-textbox[elem_id="text_input_alpha_final"] > label > .label-text::before,
-.gradio-checkbox[elem_id="use_file_cb_alpha_final"] > label > .label-text > span::before,
-.gradio-textbox[elem_id="speech_prompt_alpha_final"] > label > .label-text::before,
-.gradio-dropdown[elem_id="speaker_voice_alpha_final"] > label > .label-text::before,
-.gradio-slider[elem_id="temperature_slider_alpha_final"] > label > .label-text > span::before {{
-    margin-left: 10px; vertical-align: -2px; font-size: 1.1em; opacity: 0.8;
-}}
-.gradio-textbox[elem_id="text_input_alpha_final"] > label > .label-text::before {{ content: '📝'; }}
-.gradio-checkbox[elem_id="use_file_cb_alpha_final"] > label > .label-text > span::before {{ content: '📄'; }}
-.gradio-textbox[elem_id="speech_prompt_alpha_final"] > label > .label-text::before {{ content: '🗣️'; }}
-.gradio-dropdown[elem_id="speaker_voice_alpha_final"] > label > .label-text::before {{ content: '🎤'; }}
-.gradio-slider[elem_id="temperature_slider_alpha_final"] > label > .label-text > span::before {{ content: '🌡️'; }}
-#output_audio_player_alpha_final audio {{ width: 100%; border-radius: var(--radius-input); margin-top:1rem; box-shadow: 0 2px 5px rgba(0,0,0,0.08); }}
-.temp_description_class_alpha_final {{ font-size: 0.88em; color: var(--app-text-secondary); margin-top: -0.3rem; margin-bottom: 1.2rem; }}
-.app-footer-container-final {{text-align:center;font-size:0.9em;color: var(--app-text-secondary);opacity:0.9; margin-top:3.5rem;padding:1.5rem 0; border-top:1px solid var(--app-border-color);}}
-.gradio-examples {{ margin-top: 2.5rem !important; }}
-.gradio-examples > .gradio-label > .label-text {{ font-size: 1.1em !important; font-weight: 700 !important; color: var(--app-text-primary) !important; text-align:center; margin-bottom: 1rem !important; }}
-.gradio-examples table th {{ background-color: var(--app-input-bg) !important; font-weight:700 !important; font-size:0.9em !important; padding: 0.6rem 0.5rem !important; text-align:right !important; }}
-.gradio-examples table td {{ padding: 0.6rem 0.5rem !important; font-size:0.9em !important; }}
-.gradio-examples .gr-sample-button {{ background-color: rgba({int(BUTTON_BG[1:3],16)},{int(BUTTON_BG[3:5],16)},{int(BUTTON_BG[5:7],16)}, 0.1) !important; color: var(--app-button-bg) !important; border: 1px solid rgba({int(BUTTON_BG[1:3],16)},{int(BUTTON_BG[3:5],16)},{int(BUTTON_BG[5:7],16)}, 0.3) !important; font-weight:500 !important; }}
-#output_audio_player_alpha_final > .gradio-label {{ display: none !important; }}
-#file_uploader_alpha_final > .gradio-label {{ display: none !important; }}
 """
-alpha_header_html_final = """
-<div class='app-header-container'>
-  <h1>Alpha Translator</h1>
-  <p>جادوی ترجمه و تلفظ در دستان شما</p>
-</div>
-"""
-with gr.Blocks(theme=gr.themes.Base(font=[gr.themes.GoogleFont("Vazirmatn")]), css=custom_css_final_attempt, title="Alpha TTS") as demo:
-    gr.HTML(alpha_header_html_final)
-    with gr.Column(elem_classes=["main-content-wrapper-alpha"]):
-        use_file_input_cb = gr.Checkbox(label=LABEL_FILE_UPLOAD, value=False, elem_id="use_file_cb_alpha_final")
-        uploaded_file_input = gr.File(label=" ", file_types=['.txt'], visible=False, elem_id="file_uploader_alpha_final" )
-        text_to_speak_tb = gr.Textbox(label=LABEL_TEXT_INPUT, placeholder="مثال: سلام، فردا هوا چطور است؟", lines=5, value="", visible=True, elem_id="text_input_alpha_final")
-        use_file_input_cb.change(fn=lambda x: (gr.update(visible=x), gr.update(visible=not x)), inputs=use_file_input_cb, outputs=[uploaded_file_input, text_to_speak_tb])
-        speech_prompt_tb = gr.Textbox(label=LABEL_SPEECH_PROMPT, placeholder="مثال: با لحنی شاد و پرانرژی", value="با لحنی دوستانه و رسا صحبت کن.", lines=2, elem_id="speech_prompt_alpha_final")
-        speaker_voice_dd = gr.Dropdown(SPEAKER_VOICES, label=LABEL_SPEAKER_VOICE, value="Charon", elem_id="speaker_voice_alpha_final")
-        temperature_slider = gr.Slider(minimum=0.1, maximum=1.5, step=0.05, value=0.9, label=LABEL_TEMPERATURE, elem_id="temperature_slider_alpha_final")
-        gr.Markdown("<p class='temp_description_class_alpha_final'>مقادیر بالاتر = تنوع بیشتر، مقادیر پایین‌تر = یکنواختی بیشتر.</p>")
-        generate_button = gr.Button("🚀 تولید و پخش صدا", elem_classes=["generate-button-final-alpha"], elem_id="generate_button_alpha_final")
-        output_audio = gr.Audio(type="filepath", elem_id="output_audio_player_alpha_final", label=" ")
-        generate_button.click(fn=gradio_tts_interface, inputs=[ use_file_input_cb, uploaded_file_input, text_to_speak_tb, speech_prompt_tb, speaker_voice_dd, temperature_slider ], outputs=[output_audio] )
-        gr.Examples(
-            label="نمونه‌های کاربردی",
-            examples=[
-                [False, None, "قیمت این لباس چقدر است؟", "با لحنی مودبانه و سوالی.", "Zubenelgenubi", 0.75],
-                [False, None, "می‌توانید آدرس را روی نقشه به من نشان دهید؟", "واضح و با سرعت متوسط.", "Achird", 0.8],
-                [False, None, "ببخشید، متوجه نشدم. امکان دارد تکرار کنید؟", "کمی آهسته‌تر و شمرده.", "Vindemiatrix", 0.6],
-            ],
-            inputs=[ use_file_input_cb, uploaded_file_input, text_to_speak_tb, speech_prompt_tb, speaker_voice_dd, temperature_slider ],
-            outputs=[output_audio],
             fn=gradio_tts_interface,
-            cache_examples=os.getenv("GRADIO_CACHE_EXAMPLES", "False").lower() == "true"
         )
-    gr.Markdown("<p class='app-footer-container-final'>Alpha Language Learning © 2025</p>")
 if __name__ == "__main__":
-    logging.info("اپلیکیشن Alpha TTS در حال راه‌اندازی است...")
-    if not os.environ.get("GEMINI_API_KEY_1") and not os.environ.get("GEMINI_API_KEY"):
-         logging.warning("هشدار: هیچ کلید API جمینای (GEMINI_API_KEY_1 یا GEMINI_API_KEY) در متغیرهای محیطی یافت نشد. اپلیکیشن ممکن است کار نکند.")
-    demo.launch(server_name="0.0.0.0", server_port=int(os.getenv("PORT", 7860)), debug=os.environ.get("GRADIO_DEBUG", "False").lower() == "true", show_error=True )

 import gradio as gr
 import os
 import time
+import threading
+import sys
 import logging
+import traceback
+import asyncio
+# TTS specific imports from second script
+import mimetypes
+import re
+import struct
+# import zipfile # Not directly used in final combined code
+from google import genai # For TTS
+from google.genai import types as genai_types # For TTS
 try:
     from pydub import AudioSegment
     PYDUB_AVAILABLE = True
 except ImportError:
     PYDUB_AVAILABLE = False
+    logging.warning("Pydub is not available. Audio merging will be disabled. Falling back to single file or ZIP.")
+# --- START: پیکربندی لاگینگ (From Alpha Translator) ---
+logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(levelname)s - %(threadName)s - %(message)s')
+# --- END: پیکربندی لاگینگ ---
+# --- START: منطق چرخش API Key ---
+# Collect every consecutively numbered GEMINI_API_KEY_<n> environment variable,
+# starting at n = 1. The scan stops at the first number whose variable is
+# missing or empty, so keys placed after a gap are not picked up.
+API_KEYS_GEMINI = []
+i = 1
+while True:
+    key = os.environ.get(f'GEMINI_API_KEY_{i}')
+    if key:
+        API_KEYS_GEMINI.append(key)
+        i += 1
+    else:
+        break
+NUM_GEMINI_KEYS = len(API_KEYS_GEMINI)
+# Rotation state used by get_gemini_api_key_sync(): the position of the next
+# key to hand out and the lock that is held while that position is advanced.
+current_gemini_key_index = 0
+gemini_key_lock = threading.Lock()
+# Report the outcome of the scan once at import time: an error when no key was
+# found, otherwise the number of keys loaded.
+if NUM_GEMINI_KEYS == 0:
+    logging.error(
+        'خطای حیاتی: هیچ Secret با نام GEMINI_API_KEY_n (مثلاً GEMINI_API_KEY_1) یافت نشد! ' +
+        'قابلیت تبدیل متن به گفتار غیرفعال خواهد بود. لطفاً Secret ها را در تنظیمات Space خود اضافه کنید.'
+    )
+else:
+    logging.info(f"تعداد {NUM_GEMINI_KEYS} کلید API جیمینای بارگذاری شد.")
+def get_gemini_api_key_sync():
+    """Return the next Gemini API key in round-robin order.
+
+    Returns:
+        The selected key string, or None when no GEMINI_API_KEY_<n> key was
+        loaded at import time.
+
+    The rotation index is read and advanced while holding ``gemini_key_lock``
+    so that concurrent callers each receive a distinct position.
+    """
+    global current_gemini_key_index
+    if NUM_GEMINI_KEYS == 0:
+        return None
+    with gemini_key_lock:
+        key_index = current_gemini_key_index
+        current_gemini_key_index = (key_index + 1) % NUM_GEMINI_KEYS
+    # Identify the key by its 1-based position (matching GEMINI_API_KEY_<n>)
+    # rather than by a fragment of the secret, so no key material reaches the logs.
+    logging.info(f"TTS Gemini: استفاده از کلید API با اندیس چرخشی: {key_index + 1}/{NUM_GEMINI_KEYS}")
+    return API_KEYS_GEMINI[key_index]
+# --- END: منطق چرخش API Key ---
+# --- START: تابع ری‌استارت خودکار ---
+def auto_restart_service():
+    """Sleep for 24 hours, then terminate the process with exit status 1.
+
+    The call blocks for the whole interval. Per the log message, the exit is
+    intended to make the hosting platform restart the app.
+    NOTE(review): presumably started on a background thread so the UI is not
+    blocked -- the caller is not visible here; confirm.
+    """
+    RESTART_INTERVAL_SECONDS = 24 * 60 * 60
+    logging.info(f"سرویس برای ری‌استارت خودکار پس از {RESTART_INTERVAL_SECONDS / 3600:.0f} ساعت زمان‌بندی شده است.")
+    time.sleep(RESTART_INTERVAL_SECONDS)
+    logging.info(f"زمان ری‌استارت خودکار ({RESTART_INTERVAL_SECONDS / 3600:.0f} ساعت) فرا رسیده است. برنامه خارج می‌شود تا توسط پلتفرم ری‌استارت شود...")
+    # os._exit ends the process immediately, without running cleanup handlers.
+    os._exit(1)
+# --- END: تابع ری‌استارت خودکار ---
+# --- START: TTS Core Logic ---
 SPEAKER_VOICES = [
     "Achird", "Zubenelgenubi", "Vindemiatrix", "Sadachbia", "Sadaltager",
     "Sulafat", "Laomedeia", "Achernar", "Alnilam", "Schedar", "Gacrux",
     "Rasalthgeti", "Orus", "Aoede", "Callirrhoe", "Autonoe", "Enceladus",
     "Iapetus", "Zephyr", "Puck", "Charon", "Kore", "Fenrir", "Leda"
 ]
+# Gemini speech-generation model id. The TTS preview models belong to the 2.5
+# family; "gemini-1.5-flash-preview-tts" is not a published model id.
+FIXED_MODEL_NAME = "gemini-2.5-flash-preview-tts"
+# Maximum number of characters sent to the model in one request.
 DEFAULT_MAX_CHUNK_SIZE = 3800
+# Pause, in seconds, between consecutive chunk requests.
+DEFAULT_SLEEP_BETWEEN_REQUESTS = 8
+# Base name used for the generated audio files.
+DEFAULT_OUTPUT_FILENAME_BASE = "alpha_tts_audio"
+def _log_tts(message, log_list_ref):
+    """Record a TTS progress message.
+
+    The message is appended to ``log_list_ref`` (the caller's list, mutated in
+    place) and also written to the application log at INFO level with a
+    ``[TTS_CORE]`` prefix.
+    """
     log_list_ref.append(message)
+    logging.info(f"[TTS_CORE] {message}")
 def save_binary_file(file_name, data, log_list_ref):
+    """Write ``data`` to ``file_name`` in binary mode.
+
+    Returns:
+        ``file_name`` on success, or None if any exception was raised while
+        opening or writing. The outcome is logged through ``_log_tts`` in
+        both cases; the exception itself is not re-raised.
+    """
     try:
         with open(file_name, "wb") as f: f.write(data)
+        _log_tts(f"✅ فایل ذخیره شد: {file_name}", log_list_ref)
         return file_name
     except Exception as e:
+        _log_tts(f"❌ خطا در ذخیره فایل {file_name}: {e}", log_list_ref)
         return None
 def convert_to_wav(audio_data: bytes, mime_type: str) -> bytes:
 def smart_text_split(text, max_size=3800, log_list_ref=None):
+    """Split ``text`` into chunks of at most ``max_size`` characters.
+
+    Text that already fits is returned unchanged as a single-element list.
+    Otherwise the text is cut at sentence boundaries (whitespace following
+    one of ``. ! ? ؟ ۔``) and sentences are packed greedily into chunks. A
+    single sentence longer than ``max_size`` is cut at the last comma,
+    semicolon, colon or space found in the second half of the window, or at
+    exactly ``max_size`` characters when no such character exists.
+
+    Args:
+        text: The text to split.
+        max_size: Maximum chunk length in characters; must be at least 1
+            whenever the text does not already fit.
+        log_list_ref: Optional list that receives a summary message via
+            ``_log_tts``. An empty list is a valid target.
+
+    Returns:
+        The non-empty, whitespace-stripped chunks in their original order.
+
+    Raises:
+        ValueError: If the text needs splitting and ``max_size`` is below 1.
+    """
     if len(text) <= max_size: return [text]
+    # With a non-positive limit the hard-split loop below can never shrink the
+    # remaining text, so fail fast instead of looping forever.
+    if max_size < 1:
+        raise ValueError(f"max_size must be at least 1, got {max_size}")
     chunks, current_chunk = [], ""
+    sentences = re.split(r'(?<=[.!?؟۔])\s+', text)
     for sentence in sentences:
         if len(current_chunk) + len(sentence) + 1 > max_size:
             if current_chunk: chunks.append(current_chunk.strip())
             current_chunk = sentence
             while len(current_chunk) > max_size:
+                # Right-most soft break in the second half of the window; -1 if none.
+                split_idx = max(
+                    current_chunk.rfind(punc, max_size // 2, max_size)
+                    for punc in ('،', ',', ';', ':', ' ')
+                )
+                if split_idx != -1:
+                    part, current_chunk = current_chunk[:split_idx+1], current_chunk[split_idx+1:]
+                else:
+                    part, current_chunk = current_chunk[:max_size], current_chunk[max_size:]
                 chunks.append(part.strip())
+        else:
+            current_chunk += (" " if current_chunk and sentence else "") + sentence
     if current_chunk: chunks.append(current_chunk.strip())
     final_chunks = [c for c in chunks if c]
+    # Compare against None: an empty list is falsy but is still a log target.
+    if log_list_ref is not None: _log_tts(f"📊 متن به {len(final_chunks)} قطعه تقسیم شد.", log_list_ref)
     return final_chunks
 def merge_audio_files_func(file_paths, output_path, log_list_ref):
+    """Concatenate the audio files in ``file_paths`` into one WAV at ``output_path``.
+
+    Files are appended in list order, with ``AudioSegment.silent(duration=150)``
+    inserted after every entry except the last (pydub durations are in
+    milliseconds). Paths that do not exist are logged and skipped.
+
+    Returns:
+        True once the combined audio has been exported; False when pydub is
+        unavailable or any exception is raised (the traceback is logged).
+
+    NOTE(review): if none of the paths exist, an empty segment is still
+    exported and True is returned -- confirm whether callers rely on that.
+    """
+    if not PYDUB_AVAILABLE:
+        _log_tts("❌ Pydub در دسترس نیست. ادغام فایل انجام نشد.", log_list_ref)
+        return False
     try:
+        _log_tts(f"🔗 شروع ادغام {len(file_paths)} فایل صوتی...", log_list_ref)
         combined = AudioSegment.empty()
         for i, fp in enumerate(file_paths):
+            if os.path.exists(fp):
+                segment = AudioSegment.from_file(fp)
+                combined += segment
+                # Short gap between parts; no trailing silence after the last one.
+                if i < len(file_paths) - 1:
+                    combined += AudioSegment.silent(duration=150)
+            else:
+                _log_tts(f"⚠️ فایل صوتی برای ادغام یافت نشد: {fp}", log_list_ref)
         combined.export(output_path, format="wav")
+        _log_tts(f"✅ فایل صوتی با موفقیت در '{output_path}' ادغام و ذخیره شد.", log_list_ref)
+        return True
+    except Exception as e:
+        _log_tts(f"❌ خطا در هنگام ادغام فایل‌های صوتی: {e}\n{traceback.format_exc()}", log_list_ref)
+        return False
 def core_generate_audio(text_input, prompt_input, selected_voice, temperature_val, log_list_ref):
     output_base_name = DEFAULT_OUTPUT_FILENAME_BASE
     max_chunk, sleep_time = DEFAULT_MAX_CHUNK_SIZE, DEFAULT_SLEEP_BETWEEN_REQUESTS
+    _log_tts("🚀 شروع فرآیند تولید صدا...", log_list_ref)
+    api_key = get_gemini_api_key_sync()
+    if not api_key:
+        _log_tts("❌ کلید API جیمینای معتبری یافت نشد یا دریافت نشد. عملیات متوقف شد.", log_list_ref)
+        return None, "خطا: کلید API جیمینای برای سرویس TTS در دسترس نیست."
+    # REMOVED: genai.configure(api_key=api_key) - This was causing the error.
+    if not text_input or not text_input.strip():
+        _log_tts("❌ متن ورودی برای تبدیل به گفتار خالی است.", log_list_ref)
+        return None, "خطا: متن ورودی خالی است."
     text_chunks = smart_text_split(text_input, max_chunk, log_list_ref)
+    if not text_chunks:
+        _log_tts("❌ متن قابل پردازش برای تبدیل به گفتار نیست.", log_list_ref)
+        return None, "خطا: متن قابل پردازش نیست."
+    generated_files = []
     for i, chunk in enumerate(text_chunks):
+        _log_tts(f"🔊 پردازش قطعه {i+1}/{len(text_chunks)}...", log_list_ref)
+        final_text_for_tts = f'"{prompt_input}"\n{chunk}' if prompt_input and prompt_input.strip() else chunk
         try:
+            # Pass api_key directly to the model instance
+            # Also, FIXED_MODEL_NAME should be just the model ID like "gemini-1.5-flash-preview-tts"
+            # The SDK often prefixes with "models/" internally or expects it.
+            # The `genai.GenerativeModel` constructor takes `model_name`.
+            # If `FIXED_MODEL_NAME` is `gemini-1.5-flash-preview-tts`, it's correct.
+            tts_model = genai.GenerativeModel(FIXED_MODEL_NAME, api_key=api_key)
+            # IMPORTANT: The `selected_voice` (e.g., "Achird", "Zephyr") from the SPEAKER_VOICES list
+            # is still NOT being used in the API call to `tts_model.generate_content`.
+            # To use these voices, you would need to find the correct parameter in the
+            # `generation_config` or the `generate_content` method for the `FIXED_MODEL_NAME`
+            # that specifies the voice. This is highly dependent on the specific model's API.
+            # For example, it could be:
+            # generation_config=genai_types.GenerationConfig(
+            #     temperature=temperature_val,
+            #     response_mime_type="audio/wav",
+            #     voice_name=selected_voice  # This is a HYPOTHETICAL parameter
+            # )
+            # Or it might be part of a more complex `request_options` or `tools` configuration.
+            # Without knowing the exact API for voice selection for "gemini-1.5-flash-preview-tts",
+            # the dropdown will select a voice, but the API will likely use a default voice.
+            _log_tts(f"Selected voice from UI: {selected_voice} (Note: This voice may not be used if API parameter is unknown)", log_list_ref)
+            response = tts_model.generate_content(
+                final_text_for_tts,
+                generation_config=genai_types.GenerationConfig(
+                    temperature=temperature_val,
+                    response_mime_type="audio/wav"
+                ),
+            )
+            fname_base = f"{output_base_name}_part{i+1:03d}"
+            audio_bytes = None
+            mime_type = None
+            # Attempt to extract audio data robustly
+            if response.parts:
+                for part in response.parts:
+                    # Check for new SDK's common blob structure
+                    if hasattr(part, 'blob') and hasattr(part.blob, 'mime_type') and hasattr(part.blob, 'data') and part.blob.mime_type.startswith("audio/"):
+                        audio_bytes = part.blob.data
+                        mime_type = part.blob.mime_type
+                        break
+                    # Check for inline_data (older or different response structure)
+                    elif hasattr(part, 'inline_data') and hasattr(part.inline_data, 'mime_type') and hasattr(part.inline_data, 'data') and part.inline_data.mime_type.startswith("audio/"):
+                        audio_bytes = part.inline_data.data
+                        mime_type = part.inline_data.mime_type
+                        break
+                    # Simpler direct data attribute check (less common but possible)
+                    elif hasattr(part, 'mime_type') and hasattr(part, 'data') and part.mime_type.startswith("audio/"):
+                        audio_bytes = part.data
+                        mime_type = part.mime_type
+                        break
+            # Fallback if candidates structure is present (from AlphaTTS original code)
+            if not audio_bytes and response.candidates and response.candidates[0].content.parts:
+                 for part in response.candidates[0].content.parts:
+                    if hasattr(part, 'inline_data') and hasattr(part.inline_data, 'mime_type') and hasattr(part.inline_data, 'data') and part.inline_data.mime_type.startswith("audio/"):
+                        audio_bytes = part.inline_data.data
+                        mime_type = part.inline_data.mime_type
+                        break
+            if not audio_bytes:
+                _log_tts(f"⚠️ پاسخ API برای قطعه {i+1} بدون داده صوتی معتبر دریافت شد.", log_list_ref)
+                _log_tts(f"ساختار پاسخ (Response structure): {response}", log_list_ref)
+                continue
+            if not mime_type:
+                _log_tts(f"⚠️ MIME type برای قطعه {i+1} یافت نشد. پیش‌فرض wav.", log_list_ref)
+                mime_type = "audio/wav"
+            ext = mimetypes.guess_extension(mime_type) or ".wav"
+            if "audio/L" in mime_type and ext == ".wav":
+                audio_bytes = convert_to_wav(audio_bytes, mime_type)
+            if not ext.startswith("."): ext = "." + ext
+            fpath = save_binary_file(f"{fname_base}{ext}", audio_bytes, log_list_ref)
+            if fpath:
+                generated_files.append(fpath)
+        except Exception as e:
+            _log_tts(f"❌ خطا در تولید قطعه صوتی {i+1} با Gemini: {e}", log_list_ref)
+            # Attempt to get more details from the exception if it's an API error
+            if hasattr(e, 'message'): # Standard Python exception message
+                 _log_tts(f"پیام خطا: {e.message}", log_list_ref)
+            if hasattr(e, 'response'): # Often present in google.api_core.exceptions
+                _log_tts(f"جزئیات پاسخ خطای Gemini API: {e.response}", log_list_ref)
+            # traceback.print_exc() # For more detailed stack trace in logs if needed
+            _log_tts(f"Traceback: {traceback.format_exc()}", log_list_ref)
+            # If the error is due to the API key itself (e.g., quota, invalid)
+            # the key rotation should ideally handle it on the next call, but for TTS chunks,
+            # this chunk fails.
+            continue
+        if i < len(text_chunks) - 1 and len(text_chunks) > 1:
+            _log_tts(f"💤 توقف کوتاه ({sleep_time} ثانیه) قبل از پردازش قطعه بعدی...", log_list_ref)
+            time.sleep(sleep_time)
+    if not generated_files:
+        _log_tts("❌ هیچ فایل صوتی تولید نشد.", log_list_ref)
+        return None, "تولید صدا ناموفق بود. هیچ فایلی ایجاد نشد."
+    _log_tts(f"🎉 {len(generated_files)} فایل(های) صوتی با موفقیت تولید شد.", log_list_ref)
+    final_audio_file = None
+    final_output_path_base = f"{output_base_name}_final"
+    if len(generated_files) > 1:
         if PYDUB_AVAILABLE:
+            merged_fn = f"{final_output_path_base}.wav"
+            if os.path.exists(merged_fn):
+                try: os.remove(merged_fn)
+                except OSError as e: _log_tts(f"⚠️ عدم امکان حذف فایل ادغام شده قبلی '{merged_fn}': {e}", log_list_ref)
+            if merge_audio_files_func(generated_files, merged_fn, log_list_ref):
+                final_audio_file = merged_fn
+                for fp in generated_files:
+                    if os.path.abspath(fp) != os.path.abspath(merged_fn):
+                        try: os.remove(fp)
+                        except OSError as e_del: _log_tts(f"⚠️ عدم امکان حذف فایل موقت '{fp}': {e_del}", log_list_ref)
+            else:
+                _log_tts("⚠️ ادغام فایل‌های صوتی ناموفق بود. اولین قطعه ارائه می‌شود.", log_list_ref)
+                if generated_files:
+                    try:
+                        first_chunk_path = generated_files[0]
+                        target_ext = os.path.splitext(first_chunk_path)[1]
+                        fallback_fn = f"{final_output_path_base}_fallback{target_ext}"
+                        if os.path.exists(fallback_fn): os.remove(fallback_fn)
+                        os.rename(first_chunk_path, fallback_fn)
+                        final_audio_file = fallback_fn
+                        for i_gf in range(1, len(generated_files)):
+                             try: os.remove(generated_files[i_gf])
+                             except OSError as e_del: _log_tts(f"⚠️ عدم امکان حذف فایل موقت '{generated_files[i_gf]}': {e_del}", log_list_ref)
+                    except Exception as e_rename_fallback:
+                        _log_tts(f"خطا در تغییر نام فایل اولین قطعه (fallback): {e_rename_fallback}", log_list_ref)
+                        final_audio_file = generated_files[0]
+        else:
+            _log_tts("⚠️ Pydub برای ادغام در دسترس نیست. اولین قطعه صوتی ارائه می‌شود.", log_list_ref)
+            if generated_files:
+                try:
+                    first_chunk_path = generated_files[0]
+                    target_ext = os.path.splitext(first_chunk_path)[1]
+                    single_fallback_fn = f"{final_output_path_base}_single{target_ext}"
+                    if os.path.exists(single_fallback_fn): os.remove(single_fallback_fn)
+                    os.rename(first_chunk_path, single_fallback_fn)
+                    final_audio_file = single_fallback_fn
+                    for i_gf in range(1, len(generated_files)):
+                        _log_tts(f"قطعه اضافی موجود: {generated_files[i_gf]} (ادغام نشده)", log_list_ref)
+                except Exception as e_rename_nopydub:
+                    _log_tts(f"خطا در تغییر نام اولین قطعه (بدون pydub): {e_rename_nopydub}", log_list_ref)
+                    final_audio_file = generated_files[0]
+    elif len(generated_files) == 1:
         try:
+            single_file_path = generated_files[0]
+            target_ext = os.path.splitext(single_file_path)[1]
+            final_single_fn = f"{final_output_path_base}{target_ext}"
+            if os.path.exists(final_single_fn) and os.path.abspath(single_file_path) != os.path.abspath(final_single_fn):
+                 os.remove(final_single_fn)
+            if os.path.abspath(single_file_path) != os.path.abspath(final_single_fn):
+                 os.rename(single_file_path, final_single_fn)
+            final_audio_file = final_single_fn
+        except Exception as e_rename_single:
+            _log_tts(f"خطا در تغییر نام فایل تکی نهایی: {e_rename_single}", log_list_ref)
+            final_audio_file = generated_files[0]
+    if final_audio_file and not os.path.exists(final_audio_file):
+        _log_tts(f"⚠️ فایل صوتی نهایی '{final_audio_file}' پس از پردازش وجود ندارد!", log_list_ref)
+        return None, "خطا: فایل صوتی نهایی یافت نشد."
+    return final_audio_file, "موفق"
def gradio_tts_interface(use_file_input, uploaded_file, text_to_speak, speech_prompt, speaker_voice, temperature):
    """Gradio callback that converts typed or uploaded text to speech.

    Args:
        use_file_input: When truthy, the text is read from ``uploaded_file``;
            otherwise ``text_to_speak`` is used.
        uploaded_file: Value delivered by the file component: either an object
            exposing the path as ``.name`` or a plain path string.
        text_to_speak: Text typed into the UI textbox.
        speech_prompt: Optional style hint forwarded to ``core_generate_audio``;
            ``None`` is treated as an empty string.
        speaker_voice: Selected voice name, forwarded to ``core_generate_audio``.
        temperature: Temperature value, forwarded to ``core_generate_audio``.

    Returns:
        A ``(audio_path, status_message)`` tuple. ``audio_path`` is ``None``
        whenever validation or generation fails.
    """
    logs_for_this_run = []

    if NUM_GEMINI_KEYS == 0:
        return None, "خطای پیکربندی: هیچ کلید API جیمینای برای سرویس TTS تنظیم نشده است."

    # The prompt is optional and may arrive as None (e.g. from an API client);
    # normalise it so the slicing below cannot raise TypeError.
    speech_prompt = speech_prompt or ""

    if use_file_input:
        # The component may hand over an object carrying the path in `.name`
        # or the path itself as a string; accept both forms.
        file_path = getattr(uploaded_file, "name", None)
        if file_path is None and isinstance(uploaded_file, str):
            file_path = uploaded_file
        if not file_path:
            return None, "خطا: فایل متنی انتخاب نشده است در حالی که گزینه استفاده از فایل فعال است."
        try:
            # utf-8-sig reads plain UTF-8 as well, but strips a leading BOM so
            # it is not passed on as part of the text.
            with open(file_path, 'r', encoding='utf-8-sig') as f:
                actual_text = f.read().strip()
        except Exception as e:
            _log_tts(f"❌ خطا در خواندن فایل متنی: {e}", logs_for_this_run)
            return None, f"خطا در خواندن فایل: {e}"
        if not actual_text:
            return None, "خطا: فایل متنی انتخاب شده خالی است."
        _log_tts(f"خوانش متن از فایل: {file_path}", logs_for_this_run)
    else:
        actual_text = text_to_speak
        if not actual_text or not actual_text.strip():
            return None, "خطا: لطفاً متنی را برای تبدیل به گفتار وارد کنید."

    _log_tts(f"متن ورودی برای TTS (اولین 50 کاراکتر): '{actual_text[:50]}...'", logs_for_this_run)
    _log_tts(f"تنظیمات: Speaker={speaker_voice}, Temp={temperature}, Prompt='{speech_prompt[:30]}...'", logs_for_this_run)

    try:
        final_audio_path, generation_status_msg = core_generate_audio(
            actual_text, speech_prompt, speaker_voice, temperature, logs_for_this_run
        )
        if final_audio_path and generation_status_msg == "موفق":
            status_message_ui = "✅ تبدیل متن به گفتار با موفقیت انجام شد."
            _log_tts(status_message_ui, logs_for_this_run)
            return final_audio_path, status_message_ui
        if final_audio_path:
            # A file exists but the core reported something other than success.
            status_message_ui = f"⚠️ {generation_status_msg} فایل صوتی ممکن است ناقص باشد."
            _log_tts(status_message_ui + f" Path: {final_audio_path}", logs_for_this_run)
            return final_audio_path, status_message_ui
        # No file path: generation failed.
        status_message_ui = f"❌ {generation_status_msg}"
        _log_tts(status_message_ui, logs_for_this_run)
        return None, status_message_ui
    except Exception as e:
        # Boundary handler: the UI only gets the exception type, the full
        # traceback goes to the log.
        _log_tts(f"❌ خطای پیش‌بینی نشده در gradio_tts_interface: {e}\n{traceback.format_exc()}", logs_for_this_run)
        return None, f"خطای داخلی سرویس: {type(e).__name__}"
+# --- END: TTS Core Logic ---
+# --- START: بخش UI و Gradio ---
# Colour palette. These values are injected into the `:root` CSS variables of
# `custom_css`; FLY_LIGHT_BACKGROUND_HEX is also used by the Gradio theme.

# Primary / secondary / accent colours.
FLY_PRIMARY_COLOR_HEX = "#4F46E5"
FLY_SECONDARY_COLOR_HEX = "#10B981"
FLY_ACCENT_COLOR_HEX = "#D97706"

# Text colours.
FLY_TEXT_COLOR_HEX = "#1F2937"
FLY_SUBTLE_TEXT_HEX = "#6B7280"

# Backgrounds and borders.
FLY_LIGHT_BACKGROUND_HEX = "#F9FAFB"
FLY_WHITE_HEX = "#FFFFFF"
FLY_BORDER_COLOR_HEX = "#D1D5DB"
FLY_INPUT_BG_HEX_SIMPLE = "#F3F4F6"
FLY_PANEL_BG_SIMPLE = "#E0F2FE"

# Base Gradio theme: Inter with generic fallbacks, light page background.
app_theme_outer = gr.themes.Base(
    font=[gr.themes.GoogleFont("Inter"), "system-ui", "sans-serif"]
).set(body_background_fill=FLY_LIGHT_BACKGROUND_HEX)
# Stylesheet passed to gr.Blocks. It is assembled from adjacent string literals
# (one per section) so each part can carry its own comment; the concatenated
# result is a single CSS string. Braces are doubled because the brace-bearing
# sections are f-strings.
custom_css = (
    # Web fonts.
    """
@import url('https://fonts.googleapis.com/css2?family=Vazirmatn:wght@300;400;500;600;700;800&display=swap');
@import url('https://fonts.googleapis.com/css2?family=Poppins:wght@400;500;600;700;800&display=swap');
@import url('https://fonts.googleapis.com/css2?family=Inter:wght@400;500;600;700;800&display=swap');
"""
    # CSS variables fed from the Python palette constants.
    f""":root {{
    --fly-primary: {FLY_PRIMARY_COLOR_HEX}; --fly-secondary: {FLY_SECONDARY_COLOR_HEX};
    --fly-accent: {FLY_ACCENT_COLOR_HEX}; --fly-text-primary: {FLY_TEXT_COLOR_HEX};
    --fly-text-secondary: {FLY_SUBTLE_TEXT_HEX}; --fly-bg-light: {FLY_LIGHT_BACKGROUND_HEX};
    --fly-bg-white: {FLY_WHITE_HEX}; --fly-border-color: {FLY_BORDER_COLOR_HEX};
    --fly-input-bg-simple: {FLY_INPUT_BG_HEX_SIMPLE}; --fly-panel-bg-simple: {FLY_PANEL_BG_SIMPLE};
    --font-global: 'Vazirmatn', 'Inter', 'Poppins', system-ui, sans-serif;
    --font-english: 'Poppins', 'Inter', system-ui, sans-serif;
    --radius-sm: 0.375rem; --radius-md: 0.5rem; --radius-lg: 0.75rem; --radius-xl: 1rem; --radius-full: 9999px;
    --shadow-sm: 0 1px 2px 0 rgba(0,0,0,0.05); --shadow-md: 0 4px 6px -1px rgba(0,0,0,0.1),0 2px 4px -2px rgba(0,0,0,0.1);
    --shadow-lg: 0 10px 15px -3px rgba(0,0,0,0.1),0 4px 6px -4px rgba(0,0,0,0.1);
    --shadow-xl: 0 20px 25px -5px rgba(0,0,0,0.1),0 8px 10px -6px rgba(0,0,0,0.1);
    --fly-primary-rgb: 79,70,229; --fly-accent-rgb: 217,119,6;
}}
"""
    # Page shell: body, container, title card, footer, hidden Gradio chrome.
    f"""body {{font-family:var(--font-global);direction:rtl;background-color:var(--fly-bg-light);color:var(--fly-text-primary);line-height:1.7;-webkit-font-smoothing:antialiased;-moz-osx-font-smoothing:grayscale;font-size:16px;}}
.gradio-container {{max-width:100% !important;width:100% !important;min-height:100vh;margin:0 auto !important;padding:0 !important;border-radius:0 !important;box-shadow:none !important;background:linear-gradient(170deg, #E0F2FE 0%, #F3E8FF 100%);display:flex;flex-direction:column;}}
.app-title-card {{text-align:center;padding:2.5rem 1rem;margin:0;background:linear-gradient(135deg,var(--fly-primary) 0%,var(--fly-secondary) 100%);color:var(--fly-bg-white);border-bottom-left-radius:var(--radius-xl);border-bottom-right-radius:var(--radius-xl);box-shadow:var(--shadow-lg);position:relative;overflow:hidden;}}
.app-title-card::before {{content:'';position:absolute;top:-50px;right:-50px;width:150px;height:150px;background:rgba(255,255,255,0.1);border-radius:var(--radius-full);opacity:0.5;transform:rotate(45deg);}}
.app-title-card h1 {{font-size:2.25em !important;font-weight:800 !important;margin:0 0 0.5rem 0;font-family:var(--font-english);letter-spacing:-0.5px;text-shadow:0 2px 4px rgba(0,0,0,0.1);}}
.app-title-card p {{font-size:1em !important;margin-top:0.25rem;font-weight:400;color:rgba(255,255,255,0.85) !important;}}
.app-footer-fly {{text-align:center;font-size:0.85em;color:var(--fly-text-secondary);margin-top:2.5rem;padding:1rem 0;background-color:rgba(255,255,255,0.3);backdrop-filter:blur(5px);border-top:1px solid var(--fly-border-color);}}
footer,.gradio-footer,.flagging-container,.flex.row.gap-2.absolute.bottom-2.right-2.gr-compact.gr-box.gr-text-gray-500,div[data-testid="flag"],button[title="Flag"],button[aria-label="Flag"],.footer-utils {{display:none !important;visibility:hidden !important;}}
"""
    # Main content panel and the form controls inside it.
    f""".main-content-area {{flex-grow:1;padding:0.75rem;width:100%;margin:0 auto;box-sizing:border-box;}}
.content-panel-simple {{background-color:var(--fly-bg-white);padding:1rem;border-radius:var(--radius-xl);box-shadow:var(--shadow-xl);margin-top:-2rem;position:relative;z-index:10;margin-bottom:2rem;width:100%;box-sizing:border-box;}}
.content-panel-simple .gr-button.lg.primary,.content-panel-simple button[variant="primary"] {{background:var(--fly-accent) !important;margin-top:1rem !important;padding:12px 20px !important;transition:all 0.25s ease-in-out !important;color:white !important;font-weight:600 !important;border-radius:10px !important;border:none !important;box-shadow:0 3px 8px -1px rgba(var(--fly-accent-rgb),0.3) !important;width:100% !important;font-size:1em !important;display:flex;align-items:center;justify-content:center;}}
.content-panel-simple .gr-button.lg.primary:hover,.content-panel-simple button[variant="primary"]:hover {{background:#B45309 !important;transform:translateY(-1px) !important;box-shadow:0 5px 10px -1px rgba(var(--fly-accent-rgb),0.4) !important;}}
.content-panel-simple .gr-input > label + div > textarea,.content-panel-simple .gr-dropdown > label + div > div > input,.content-panel-simple .gr-dropdown > label + div > div > select,.content-panel-simple .gr-textbox > label + div > textarea, .content-panel-simple .gr-file > label + div {{border-radius:8px !important;border:1.5px solid var(--fly-border-color) !important;font-size:0.95em !important;background-color:var(--fly-input-bg-simple) !important;padding:10px 12px !important;color:var(--fly-text-primary) !important;}}
.content-panel-simple .gr-input > label + div > textarea:focus,.content-panel-simple .gr-dropdown > label + div > div > input:focus,.content-panel-simple .gr-dropdown > label + div > div > select:focus,.content-panel-simple .gr-textbox > label + div > textarea:focus, .content-panel-simple .gr-file > label + div:focus-within {{border-color:var(--fly-primary) !important;box-shadow:0 0 0 3px rgba(var(--fly-primary-rgb),0.12) !important;background-color:var(--fly-bg-white) !important;}}
.content-panel-simple .gr-file > label + div {{ text-align:center; border-style: dashed !important; }}
.content-panel-simple .gr-dropdown select {{font-family:var(--font-global) !important;width:100%;cursor:pointer;}}
.content-panel-simple .gr-textbox[label*="وضعیت"] > label + div > textarea {{background-color:var(--fly-panel-bg-simple) !important;border-color:#A5D5FE !important;min-height:auto !important; /* Adjusted for single line */ font-family:var(--font-global);font-size:0.9em !important;line-height:1.5;padding:8px 10px !important;}}
.content-panel-simple .gr-panel,.content-panel-simple div[label*="تنظیمات پیشرفته"] > .gr-accordion > .gr-panel {{border-radius:8px !important;border:1px solid var(--fly-border-color) !important;background-color:var(--fly-input-bg-simple) !important;padding:0.8rem 1rem !important;margin-top:0.6rem;box-shadow:none;}}
.content-panel-simple div[label*="تنظیمات پیشرفته"] > .gr-accordion > button.gr-button {{font-weight:500 !important;padding:8px 10px !important;border-radius:6px !important;background-color:#E5E7EB !important;color:var(--fly-text-primary) !important;border:1px solid #D1D5DB !important;}}
.content-panel-simple label > span.label-text {{font-weight:500 !important;color:#4B5563 !important;font-size:0.88em !important;margin-bottom:6px !important;display:inline-block;}}
.content-panel-simple .gr-slider label span {{font-size:0.82em !important;color:var(--fly-text-secondary);}}
.temp-description-tts {{ font-size: 0.82em !important; color: var(--fly-text-secondary) !important; margin-top: -0.5rem; margin-bottom: 1rem; padding-right: 5px; }}
.content-panel-simple div[label*="نمونه"] {{margin-top:1.5rem;}}
.content-panel-simple div[label*="نمونه"] .gr-button.gr-button-tool,.content-panel-simple div[label*="نمونه"] .gr-sample-button {{background-color:#E0E7FF !important;color:var(--fly-primary) !important;border-radius:6px !important;font-size:0.78em !important;padding:4px 8px !important;}}
.content-panel-simple .custom-hr {{height:1px;background-color:var(--fly-border-color);margin:1.5rem 0;border:none;}}
.api-warning-message {{background-color:#FFFBEB !important;color:#92400E !important;padding:10px 12px !important;border-radius:8px !important;border:1px solid #FDE68A !important;text-align:center !important;margin:0 0.2rem 1rem 0.2rem !important;font-size:0.85em !important;}}
.content-panel-simple #output_audio_tts audio {{ width: 100%; border-radius: var(--radius-md); margin-top:0.5rem; }}
"""
    # Responsive overrides for wider viewports.
    f"""@media (min-width:640px) {{.main-content-area {{padding:1.5rem;max-width:700px;}} .content-panel-simple {{padding:1.5rem;}} .app-title-card h1 {{font-size:2.5em !important;}} .app-title-card p {{font-size:1.05em !important;}} }}
@media (min-width:768px) {{
    .main-content-area {{max-width:780px;}} .content-panel-simple {{padding:2rem;}}
    .content-panel-simple .main-content-row {{display:flex !important;flex-direction:row !important;gap:1.5rem !important;}}
    .content-panel-simple .main-content-row > .gr-column:nth-child(1) {{flex-basis:60%; min-width:0;}}
    .content-panel-simple .main-content-row > .gr-column:nth-child(2) {{flex-basis:40%; min-width:0;}}
    .content-panel-simple .gr-button.lg.primary,.content-panel-simple button[variant="primary"] {{width:auto !important;align-self:flex-start;}}
    .app-title-card h1 {{font-size:2.75em !important;}} .app-title-card p {{font-size:1.1em !important;}}
}}
"""
)

# Start-up diagnostics: record the Gradio version and warn when chunk merging
# is unavailable because pydub could not be imported.
logging.info(f"Gradio version: {gr.__version__}")
if not PYDUB_AVAILABLE:
    logging.warning("Pydub (برای ادغام فایل‌های صوتی) یافت نشد. لطفاً با `pip install pydub` نصب کنید. در غیر این صورت، فقط اولین قطعه صوتی ارائه خواهد شد.")
# Build the Gradio UI. Component creation order inside the context managers
# determines the page layout, so statements are kept in their original order.
with gr.Blocks(theme=app_theme_outer, css=custom_css, title="آلفا TTS") as demo:
    # Header banner (plain string: it contains no placeholders).
    gr.HTML("""
        <div class="app-title-card">
            <h1>🚀 Alpha TTS</h1>
            <p>جادوی تبدیل متن به صدا با هوش مصنوعی Gemini</p>
        </div>
    """)
    with gr.Column(elem_classes=["main-content-area"]):
        with gr.Group(elem_classes=["content-panel-simple"]):
            # Show a visible warning when no API key is configured; the
            # callback itself also refuses to run in that case.
            if NUM_GEMINI_KEYS == 0:
                missing_key_msg = (
                    "⚠️ هشدار: قابلیت تبدیل متن به گفتار غیرفعال است. "
                    "هیچ کلید API جیمینای (با فرمت GEMINI_API_KEY_1, ...) "
                    "در بخش Secrets این Space یافت نشد. "
                    "لطفاً حداقل یک کلید با نام GEMINI_API_KEY_1 تنظیم کنید."
                )
                gr.Markdown(f"<div class='api-warning-message'>{missing_key_msg}</div>")
            status_message_output = gr.Textbox(label="وضعیت پردازش", interactive=False, lines=1, placeholder="پیام‌های وضعیت اینجا نمایش داده می‌شوند...")
            with gr.Row(elem_classes=["main-content-row"]):
                # Left column: text source (typed text or uploaded file) and style prompt.
                with gr.Column(scale=3):
                    use_file_input_cb = gr.Checkbox(label="📄 استفاده از فایل متنی (.txt)", value=False)
                    uploaded_file_input = gr.File(
                        label="آپلود فایل متنی",
                        file_types=['.txt'],
                        visible=False
                    )
                    text_to_speak_tb = gr.Textbox(
                        label="📝 متن فارسی برای تبدیل به گفتار",
                        placeholder="مثال: سلام، به پروژه آلفا خوش آمدید.",
                        lines=5,
                        value=""
                    )
                    speech_prompt_tb = gr.Textbox(
                        label="🗣️ سبک و زمینه گفتار (اختیاری)",
                        placeholder="مثال: با لحنی شاد و پرانرژی",
                        value="با لحنی دوستانه و رسا صحبت کن.",
                        lines=2
                    )
                # Right column: voice, temperature and the audio player.
                with gr.Column(scale=2):
                    speaker_voice_dd = gr.Dropdown(
                        SPEAKER_VOICES,
                        label="🎤 انتخاب گوینده (توجه: ممکن است فعلا اعمال نشود)",
                        value="Charon"
                    )
                    temperature_slider = gr.Slider(
                        minimum=0.1, maximum=1.5, step=0.05, value=0.9,
                        label="🌡️ میزان خلاقیت صدا (دما)"
                    )
                    gr.Markdown("<p class='temp-description-tts'>مقادیر بالاتر = تنوع بیشتر، مقادیر پایین‌تر = یکنواختی بیشتر.</p>", elem_classes=["temp-description-tts-container"])
                    output_audio = gr.Audio(label="🎧 فایل صوتی خروجی", type="filepath", elem_id="output_audio_tts")
            generate_button = gr.Button("🚀 تولید و پخش صدا", variant="primary", elem_classes=["lg"])
            gr.HTML("<hr class='custom-hr'>")
            # Example rows follow the callback's argument order; caching is
            # opt-in through the GRADIO_CACHE_EXAMPLES environment variable.
            gr.Examples(
                examples=[
                    [False, None, "سلام بر شما، امیدوارم روز خوبی داشته باشید. این یک نمونه صدای تولید شده توسط آلفا است.", "با لحنی گرم و صمیمی.", "Zephyr", 0.85],
                    [False, None, "این یک آزمایش برای بررسی کیفیت صدای تولید شده توسط هوش مصنوعی پیشرفته جیمینای است.", "با صدایی طبیعی، روان و کمی رسمی.", "Charon", 0.9],
                    [False, None, "آیا می‌توانم یک پیتزای پپرونی سفارش دهم؟", "پرسشی و مودبانه.", "Achird", 0.75],
                ],
                inputs=[use_file_input_cb, uploaded_file_input, text_to_speak_tb, speech_prompt_tb, speaker_voice_dd, temperature_slider],
                outputs=[output_audio, status_message_output],
                fn=gradio_tts_interface,
                cache_examples=os.getenv("GRADIO_CACHE_EXAMPLES", "False").lower() == "true",
                label="💡 نمونه‌های کاربردی"
            )
    gr.Markdown("<p class='app-footer-fly'>Alpha TTS © 2024</p>")

    def toggle_file_input(use_file):
        """Swap visibility between the file upload and the text box.

        Returns two updates, in the order (file input, text box).
        """
        if use_file:
            return gr.update(visible=True, label=" "), gr.update(visible=False)
        else:
            return gr.update(visible=False), gr.update(visible=True, label="📝 متن فارسی برای تبدیل به گفتار")

    use_file_input_cb.change(
        fn=toggle_file_input,
        inputs=use_file_input_cb,
        outputs=[uploaded_file_input, text_to_speak_tb]
    )
    # The button is always created above, so the handler is wired
    # unconditionally (the former `is not None` guard could never fail).
    generate_button.click(
        fn=gradio_tts_interface,
        inputs=[use_file_input_cb, uploaded_file_input, text_to_speak_tb, speech_prompt_tb, speaker_voice_dd, temperature_slider],
        outputs=[output_audio, status_message_output]
    )

if __name__ == "__main__":
    # The restart scheduler runs unless AUTO_RESTART_ENABLED is set to
    # something other than "true"; as a daemon thread it does not block exit.
    if os.getenv("AUTO_RESTART_ENABLED", "true").lower() == "true":
        restart_scheduler_thread = threading.Thread(target=auto_restart_service, daemon=True)
        restart_scheduler_thread.start()
    # Listen on all interfaces; the port comes from PORT, defaulting to 7860.
    demo.launch(
        server_name="0.0.0.0",
        server_port=int(os.getenv("PORT", 7860)),
        debug=os.environ.get("GRADIO_DEBUG", "False").lower() == "true",
        show_error=True
    )