Real_Time_diarization

Sleeping

App Files Community

Saiyaswanth007 committed on May 25

Commit

4562675

1 Parent(s): 8df75a7

Check point 4

Browse files

Files changed (1) hide show

app.py +9 -25

app.py CHANGED Viewed

@@ -651,8 +651,7 @@ def start_recording():
     """Start recording and transcription"""
     try:
         result = diarization_system.start_recording()
-        # Connect WebRTC to server stream
-        audio_webrtc.stream_url = "/stream"  # This is your FastRTC endpoint
         return result
     except Exception as e:
         return f"❌ Failed to start recording: {str(e)}"
@@ -706,7 +705,7 @@ def create_interface():
                 # Add WebRTC component for audio streaming
                 audio_webrtc = WebRTC(
                     label="Audio Input",
-                    streaming=True,
                     rtc_configuration={"iceServers": [{"urls": ["stun:stun.l.google.com:19302"]}]}
                 )
@@ -783,8 +782,7 @@ def create_interface():
         def on_start():
             result = start_recording()
-            # Connect WebRTC to server stream
-            audio_webrtc.stream_url = "/stream"  # This is your FastRTC endpoint
             return result, gr.update(interactive=False), gr.update(interactive=True)
         def on_stop():
@@ -840,19 +838,17 @@ def create_interface():
         status_timer = gr.Timer(2)
         status_timer.tick(refresh_status, outputs=[status_output])
-        # After creating the WebRTC component:
-        audio_webrtc.stream(
-            fn=process_webrtc_audio,
-            inputs=[audio_webrtc],
-            outputs=[conversation_output]
-        )
     return interface
 # FastAPI setup for FastRTC integration
 app = FastAPI()
 @app.get("/")
 async def root():
     return {"message": "Real-time Speaker Diarization API"}
@@ -894,12 +890,6 @@ async def api_update_settings(threshold: float, max_speakers: int):
     result = update_settings(threshold, max_speakers)
     return {"result": result}
-# FastRTC Stream setup
-if audio_handler:
-    stream = Stream(handler=audio_handler)
-    app.include_router(stream.router, prefix="/stream")
 # Main execution
 if __name__ == "__main__":
     import argparse
@@ -959,10 +949,4 @@ if __name__ == "__main__":
         api_thread.start()
         # Start Gradio in main thread
-        run_gradio()
-def process_webrtc_audio(frames):
-    # Process frames and send them to your diarization system
-    for frame in frames:
-        diarization_system.process_audio_chunk(frame)
-    return get_conversation()

     """Start recording and transcription"""
     try:
         result = diarization_system.start_recording()
+        # FastRTC connection is handled through the mounted stream
         return result
     except Exception as e:
         return f"❌ Failed to start recording: {str(e)}"
                 # Add WebRTC component for audio streaming
                 audio_webrtc = WebRTC(
                     label="Audio Input",
+                    source_url="/stream",  # Connect to the FastRTC stream endpoint
                     rtc_configuration={"iceServers": [{"urls": ["stun:stun.l.google.com:19302"]}]}
                 )
         def on_start():
             result = start_recording()
+            # FastRTC connection is handled through the mounted stream
             return result, gr.update(interactive=False), gr.update(interactive=True)
         def on_stop():
         status_timer = gr.Timer(2)
         status_timer.tick(refresh_status, outputs=[status_output])
     return interface
 # FastAPI setup for FastRTC integration
 app = FastAPI()
+# Initialize audio handler for FastRTC
+audio_handler = DiarizationHandler(diarization_system)
+stream = Stream(handler=audio_handler, modality="audio", mode="send-receive")
+stream.mount(app)  # Mount the Stream to the FastAPI app
 @app.get("/")
 async def root():
     return {"message": "Real-time Speaker Diarization API"}
     result = update_settings(threshold, max_speakers)
     return {"result": result}
 # Main execution
 if __name__ == "__main__":
     import argparse
         api_thread.start()
         # Start Gradio in main thread
+        run_gradio()