Saiyaswanth007 committed on
Commit cba237d · 1 Parent(s): 4562675

Check point 4

Files changed (1):
  1. app.py +49 -12
app.py CHANGED
@@ -635,11 +635,12 @@ audio_handler = None
 
 def initialize_system():
     """Initialize the diarization system"""
-    global audio_handler
+    global stream
     try:
         success = diarization_system.initialize_models()
         if success:
-            audio_handler = DiarizationHandler(diarization_system)
+            # Update the Stream's handler to use our DiarizationHandler
+            stream.handler = DiarizationHandler(diarization_system)
             return "✅ System initialized successfully!"
         else:
             return "❌ Failed to initialize system. Check logs for details."
@@ -651,11 +652,14 @@ def start_recording():
     """Start recording and transcription"""
     try:
         result = diarization_system.start_recording()
-        # FastRTC connection is handled through the mounted stream
        return result
     except Exception as e:
         return f"❌ Failed to start recording: {str(e)}"
 
+def on_start():
+    result = start_recording()
+    return result, gr.update(interactive=False), gr.update(interactive=True)
+
 def stop_recording():
     """Stop recording and transcription"""
     try:
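
Editor's note: the new module-level on_start mirrors the on_start callback inside create_interface; it returns a status string plus two gr.update objects that toggle button interactivity. A minimal, self-contained sketch of that wiring (the start_btn / stop_btn / status_output names here are hypothetical, not taken from this commit):

import gradio as gr

def on_start():
    # Hypothetical stand-in for start_recording(); returns status text plus
    # interactivity updates for the start and stop buttons.
    return "Recording started", gr.update(interactive=False), gr.update(interactive=True)

with gr.Blocks() as demo:
    status_output = gr.Textbox(label="Status")
    start_btn = gr.Button("Start")
    stop_btn = gr.Button("Stop", interactive=False)
    # The order of outputs matches the order of on_start's return values.
    start_btn.click(fn=on_start, outputs=[status_output, start_btn, stop_btn])

# demo.launch()
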
@@ -702,11 +706,11 @@ def create_interface():
 
         with gr.Row():
             with gr.Column(scale=2):
-                # Add WebRTC component for audio streaming
-                audio_webrtc = WebRTC(
+                # Replace WebRTC with standard Gradio audio component
+                audio_component = gr.Audio(
                     label="Audio Input",
-                    source_url="/stream",  # Connect to the FastRTC stream endpoint
-                    rtc_configuration={"iceServers": [{"urls": ["stun:stun.l.google.com:19302"]}]}
+                    sources=["microphone"],
+                    streaming=True
                 )
 
                 # Conversation display
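
Editor's note: with streaming=True, a gr.Audio microphone source delivers chunks to a .stream() callback as (sample_rate, numpy array) tuples, which is the shape process_audio_input unpacks later in this diff. A minimal sketch, assuming Gradio 4.x (not part of this commit):

import gradio as gr

def on_chunk(chunk):
    # Streaming microphone audio arrives as a (sample_rate, np.ndarray) tuple.
    if chunk is None:
        return "No audio yet"
    sample_rate, samples = chunk
    return f"Received {len(samples)} samples at {sample_rate} Hz"

with gr.Blocks() as demo:
    mic = gr.Audio(label="Audio Input", sources=["microphone"], streaming=True)
    info = gr.Textbox(label="Chunk info")
    # The callback fires as audio streams in from the browser microphone.
    mic.stream(fn=on_chunk, inputs=[mic], outputs=[info])

# demo.launch()
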
@@ -782,7 +786,6 @@ def create_interface():
 
         def on_start():
             result = start_recording()
-            # FastRTC connection is handled through the mounted stream
             return result, gr.update(interactive=False), gr.update(interactive=True)
 
         def on_stop():
@@ -838,16 +841,50 @@ def create_interface():
         status_timer = gr.Timer(2)
         status_timer.tick(refresh_status, outputs=[status_output])
 
+        # Process audio from Gradio component
+        def process_audio_input(audio_data):
+            if audio_data is not None and diarization_system.is_running:
+                # Extract audio data
+                if isinstance(audio_data, tuple) and len(audio_data) >= 2:
+                    sample_rate, audio_array = audio_data[0], audio_data[1]
+                    diarization_system.process_audio_chunk(audio_array, sample_rate)
+            return get_conversation()
+
+        # Connect audio component to processing function
+        audio_component.stream(
+            fn=process_audio_input,
+            outputs=[conversation_output]
+        )
+
     return interface
 
 
 # FastAPI setup for FastRTC integration
 app = FastAPI()
 
-# Initialize audio handler for FastRTC
-audio_handler = DiarizationHandler(diarization_system)
-stream = Stream(handler=audio_handler, modality="audio", mode="send-receive")
-stream.mount(app)  # Mount the Stream to the FastAPI app
+# Create a placeholder handler - will be properly initialized later
+class DefaultHandler(AsyncStreamHandler):
+    def __init__(self):
+        super().__init__()
+
+    async def receive(self, frame):
+        pass
+
+    async def emit(self):
+        return None
+
+    def copy(self):
+        return DefaultHandler()
+
+    async def shutdown(self):
+        pass
+
+    async def start_up(self):
+        pass
+
+# Initialize with placeholder handler
+stream = Stream(handler=DefaultHandler(), modality="audio", mode="send-receive")
+stream.mount(app)
 
 @app.get("/")
 async def root():
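
Editor's note: this commit mounts the FastRTC Stream on the FastAPI app but does not show how the Gradio interface returned by create_interface() is served. One common pattern, offered here only as an assumption about the rest of app.py, is to mount the Blocks app on the same FastAPI instance and run it with uvicorn; a minimal sketch with a placeholder interface:

import gradio as gr
import uvicorn
from fastapi import FastAPI

app = FastAPI()

with gr.Blocks() as interface:  # stand-in for create_interface()
    gr.Markdown("Speaker diarization UI placeholder")

# Serve the Gradio UI under /ui while other routes (such as the mounted
# FastRTC stream and the "/" route defined above in the diff) stay on FastAPI.
app = gr.mount_gradio_app(app, interface, path="/ui")

if __name__ == "__main__":
    uvicorn.run(app, host="0.0.0.0", port=7860)
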
 