Spaces:
Running
Running
Update preprocessing.py
Browse files- preprocessing.py +0 -20
preprocessing.py
CHANGED
@@ -1,8 +1,6 @@
|
|
1 |
import os
|
2 |
from pydub import AudioSegment
|
3 |
import noisereduce as nr
|
4 |
-
import webrtcvad
|
5 |
-
from ..config import settings
|
6 |
import numpy as np
|
7 |
import librosa
|
8 |
import soundfile as sf
|
@@ -84,21 +82,3 @@ def clean_audio_streaming(input_file: str, output_file: Optional[str] = None, ch
|
|
84 |
except Exception as e:
|
85 |
print(f"Ses temizleme hatası: {str(e)}")
|
86 |
return input_file
|
87 |
-
|
88 |
-
def _apply_vad(audio: AudioSegment, vad: webrtcvad.Vad) -> AudioSegment:
|
89 |
-
frame_duration = 30
|
90 |
-
frames = []
|
91 |
-
samples = audio.get_array_of_samples()
|
92 |
-
for i in range(0, len(samples), int(settings.SAMPLE_RATE * frame_duration / 1000)):
|
93 |
-
frame = samples[i:i + int(settings.SAMPLE_RATE * frame_duration / 1000)]
|
94 |
-
is_speech = vad.is_speech(
|
95 |
-
frame.tobytes(), sample_rate=settings.SAMPLE_RATE
|
96 |
-
)
|
97 |
-
if is_speech:
|
98 |
-
frames.extend(frame)
|
99 |
-
return AudioSegment(
|
100 |
-
data=bytes(frames),
|
101 |
-
sample_width=audio.sample_width,
|
102 |
-
frame_rate=settings.SAMPLE_RATE,
|
103 |
-
channels=audio.channels
|
104 |
-
)
|
|
|
1 |
import os
|
2 |
from pydub import AudioSegment
|
3 |
import noisereduce as nr
|
|
|
|
|
4 |
import numpy as np
|
5 |
import librosa
|
6 |
import soundfile as sf
|
|
|
82 |
except Exception as e:
|
83 |
print(f"Ses temizleme hatası: {str(e)}")
|
84 |
return input_file
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|