dev-mode-python

Paused

App Files Files

Tomtom84 committed on Apr 13

Commit

323d1a0

1 Parent(s): ad94d02

upd4

Browse files

Files changed (2) hide show

__pycache__/app.cpython-312.pyc +0 -0
app.py +29 -27

__pycache__/app.cpython-312.pyc CHANGED Viewed

Binary files a/__pycache__/app.cpython-312.pyc and b/__pycache__/app.cpython-312.pyc differ

app.py CHANGED Viewed

@@ -1,46 +1,48 @@
-from fastapi import FastAPI
 import outetts
-import os
 # Initialize the interface
 interface = outetts.Interface(
     config=outetts.ModelConfig.auto_config(
         model=outetts.Models.VERSION_1_0_SIZE_1B,
-        # For llama.cpp backend
         backend=outetts.Backend.LLAMACPP,
         quantization=outetts.LlamaCppQuantization.FP16
-        # For transformers backend
-        #backend=outetts.Backend.HF,
     )
 )
 # Load the default speaker profile
 speaker = interface.load_default_speaker("EN-FEMALE-1-NEUTRAL")
-# Or create your own speaker profiles in seconds and reuse them instantly
-# speaker = interface.create_speaker("path/to/audio.wav")
-# interface.save_speaker(speaker, "speaker.json")
-# speaker = interface.load_speaker("speaker.json")
-# Generate speech
-output = interface.generate(
-    config=outetts.GenerationConfig(
-        text="Hello, how are you doing?",
-        generation_type=outetts.GenerationType.CHUNKED,
-        speaker=speaker,
-        sampler_config=outetts.SamplerConfig(
-            temperature=0.4
-        ),
-    )
-)
-# Save to file
-output_path = os.path.join(os.getcwd(),"output.wav")
-output.save(output_path)
 app = FastAPI()
 @app.get("/")
 def greet_json():
     return {"Hello": "World!"}

+from fastapi import FastAPI, WebSocket, WebSocketDisconnect
 import outetts
+import io
 # Initialize the interface
 interface = outetts.Interface(
     config=outetts.ModelConfig.auto_config(
         model=outetts.Models.VERSION_1_0_SIZE_1B,
         backend=outetts.Backend.LLAMACPP,
         quantization=outetts.LlamaCppQuantization.FP16
     )
 )
 # Load the default speaker profile
 speaker = interface.load_default_speaker("EN-FEMALE-1-NEUTRAL")
 app = FastAPI()
 @app.get("/")
 def greet_json():
     return {"Hello": "World!"}
+@app.websocket("/ws/tts")
+async def websocket_tts(websocket: WebSocket):
+    """Serve text-to-speech over a WebSocket connection.
+
+    For every text message received from the client, speech is generated
+    with the module-level ``interface`` and ``speaker``, saved into an
+    in-memory buffer, and sent back as one binary message. The loop runs
+    until the client disconnects.
+
+    Args:
+        websocket: The incoming WebSocket connection.
+    """
+    # Function-scope import so the handler does not depend on a new
+    # file-level import.
+    import asyncio
+
+    # One lock per application: generation is moved off the event loop
+    # below, so calls to the single shared model are kept serialized here.
+    # There is no await between the lookup and the assignment, so the lazy
+    # creation cannot race on the event loop.
+    generation_lock = getattr(app.state, "tts_generation_lock", None)
+    if generation_lock is None:
+        generation_lock = asyncio.Lock()
+        app.state.tts_generation_lock = generation_lock
+
+    await websocket.accept()
+    try:
+        while True:
+            # Receive a text chunk from the client.
+            data = await websocket.receive_text()
+            generation_config = outetts.GenerationConfig(
+                text=data,
+                generation_type=outetts.GenerationType.CHUNKED,
+                speaker=speaker,
+                sampler_config=outetts.SamplerConfig(
+                    temperature=0.4
+                ),
+            )
+            # interface.generate is a synchronous call; running it in a
+            # worker thread keeps the event loop free to serve other
+            # connections while audio is being synthesized.
+            async with generation_lock:
+                output = await asyncio.to_thread(
+                    interface.generate, config=generation_config
+                )
+            # Write the audio into an in-memory buffer.
+            # NOTE(review): assumes output.save accepts a file-like object
+            # and not only a filesystem path - confirm against outetts.
+            audio_buffer = io.BytesIO()
+            output.save(audio_buffer)
+            audio_bytes = audio_buffer.getvalue()
+            # Send the audio data back to the client as bytes.
+            await websocket.send_bytes(audio_bytes)
+    except WebSocketDisconnect:
+        # The client closed the connection; leave the loop quietly.
+        pass