kennethli319 committed on
Commit
9383bb1
·
1 Parent(s): e3064ab

update tts

Browse files
Files changed (1) hide show
  1. app.py +2 -1
app.py CHANGED
@@ -8,6 +8,7 @@ from nemo.collections.tts.models import MixerTTSModel
8
 
9
  spec_generator = FastPitchModel.from_pretrained("tts_en_fastpitch_multispeaker")
10
  voc_model = HifiGanModel.from_pretrained(model_name="tts_en_hifitts_hifigan_ft_fastpitch")
 
11
 
12
  def greet(name):
13
  return "Hello " + name + "!!"
@@ -17,7 +18,7 @@ def generate_tts(text: str, speaker: int = 0):
17
  parsed = spec_generator.parse(text)
18
  spectrogram = spec_generator.generate_spectrogram(tokens=parsed, speaker=speaker)
19
  audio = voc_model.convert_spectrogram_to_audio(spec=spectrogram)
20
- return sr, audio
21
 
22
  def run():
23
  demo = gr.Interface(
 
8
 
9
  spec_generator = FastPitchModel.from_pretrained("tts_en_fastpitch_multispeaker")
10
  voc_model = HifiGanModel.from_pretrained(model_name="tts_en_hifitts_hifigan_ft_fastpitch")
11
+ voc_model.eval()
12
 
13
  def greet(name):
14
  return "Hello " + name + "!!"
 
18
  parsed = spec_generator.parse(text)
19
  spectrogram = spec_generator.generate_spectrogram(tokens=parsed, speaker=speaker)
20
  audio = voc_model.convert_spectrogram_to_audio(spec=spectrogram)
21
+ return sr, audio.to('cpu').detach().numpy()
22
 
23
  def run():
24
  demo = gr.Interface(