Spaces:

Seicas
/

VoiceToWrite

Running

App Files Community

Seicas committed on Jun 18

Commit

f9b22e5

verified ·

1 Parent(s): 4a14d8c

Update app.py

Browse files

Files changed (1) hide show

app.py +43 -24

app.py CHANGED Viewed

@@ -10,6 +10,7 @@ from asr import transcribe_file
 from diarization import diarize_segments
 from privacy import MedicalPrivacyProcessor
 from config import settings
 # HuggingFace token'ını ayarla
 HF_TOKEN = os.getenv("HF_TOKEN", "")
@@ -60,36 +61,54 @@ css = """
 .tips {background: #e7f5ff; padding: 15px; border-radius: 5px; margin-top: 20px;}
 """
-def process_audio(audio_file, is_pediatrics=True):
-    """Process audio with improved error handling"""
-    try:
-        # Clean audio
-        cleaned_audio = clean_audio(audio_file)
-        # Transcribe
-        transcription = transcribe_file(cleaned_audio)
-        # Diarize
-        diarization = diarize_segments(transcription["segments"])
-        # Process text
-        nlp = load_spacy_model()
-        processed_text = process_text(transcription, nlp, is_pediatrics)
-        return {
-            "transcription": transcription,
-            "diarization": diarization,
-            "processed_text": processed_text
-        }
     except Exception as e:
-        print(f"Error processing audio: {e}")
-        return {
-            "error": str(e),
-            "transcription": "",
-            "diarization": [],
-            "processed_text": ""
-        }
 # Ana arayüz
 with gr.Blocks(theme=gr.themes.Soft(primary_hue="indigo", secondary_hue="blue"), css=css) as demo:

 from diarization import diarize_segments
 from privacy import MedicalPrivacyProcessor
 from config import settings
+from typing import Tuple, Dict
 # HuggingFace token'ını ayarla
 HF_TOKEN = os.getenv("HF_TOKEN", "")
 .tips {background: #e7f5ff; padding: 15px; border-radius: 5px; margin-top: 20px;}
 """
+def process_audio(
+    audio_path: str,
+    do_diarize: bool = True,
+    do_enhance: bool = True,
+    do_anonymize: bool = True
+) -> Tuple[str, Dict]:
+    """
+    Process an audio file and produce its transcription.
+    Args:
+        audio_path: Path to the audio file
+        do_diarize: Whether to run speaker diarization
+        do_enhance: Whether to run audio enhancement
+        do_anonymize: Whether to anonymize personal data
+    Returns:
+        Tuple[str, Dict]: (transcription text, JSON result); (message, {}) when audio_path is empty or any step raises
+    """
+    if not audio_path:
+        return "Lütfen bir ses dosyası yükleyin.", {}
+    try:
+        # Load the audio file. NOTE(review): Audio and the helpers called below are not among the imports visible in this diff; confirm they are in scope.
+        audio = Audio.from_file(audio_path)
+        # Audio enhancement (optional)
+        if do_enhance:
+            audio = enhance_audio(audio)
+        # Speaker diarization (optional); None is passed on when it is disabled
+        if do_diarize:
+            diarization = diarize_speakers(audio)
+        else:
+            diarization = None
+        # Transcription
+        result = transcribe_audio(audio, diarization)
+        # Anonymization (optional); replaces the whole result
+        if do_anonymize:
+            result = anonymize_personal_info(result)
+        return result["text"], result  # presumably a mapping with a "text" key; confirm against transcribe_audio
     except Exception as e:
+        error_msg = f"İşlem sırasında bir hata oluştu: {str(e)}"  # any failure above is reported as text instead of being raised
+        print(error_msg)
+        return error_msg, {}
 # Ana arayüz
 with gr.Blocks(theme=gr.themes.Soft(primary_hue="indigo", secondary_hue="blue"), css=css) as demo: