kennethli319 committed on
Commit
a6dfc58
·
1 Parent(s): 3f6ca44

update tts

Browse files
Files changed (1) hide show
  1. app.py +7 -3
app.py CHANGED
@@ -1,9 +1,13 @@
1
  import gradio as gr
2
  from nemo.collections.tts.models import FastPitchModel
3
  from nemo.collections.tts.models import HifiGanModel
 
 
 
 
4
 
5
  spec_generator = FastPitchModel.from_pretrained("tts_en_fastpitch_multispeaker")
6
- tts_model = HifiGanModel.from_pretrained(model_name="tts_en_hifitts_hifigan_ft_fastpitch")
7
 
8
  def greet(name):
9
  return "Hello " + name + "!!"
@@ -12,12 +16,12 @@ def generate_tts(text: str, speaker: int = 0):
12
  sr = 22050
13
  parsed = spec_generator.parse(text)
14
  spectrogram = spec_generator.generate_spectrogram(tokens=parsed, speaker=speaker)
15
- audio = tts_model.convert_spectrogram_to_audio(spec=spectrogram)
16
  return sr, audio
17
 
18
  def run():
19
  demo = gr.Interface(
20
- fn=greet,
21
  inputs=["text",
22
  gr.Slider(0, 10, step=1)],
23
  outputs="audio",
 
1
  import gradio as gr
2
  from nemo.collections.tts.models import FastPitchModel
3
  from nemo.collections.tts.models import HifiGanModel
4
+ from nemo.collections.tts.models import MixerTTSModel
5
+
6
+ # spec_generator_2 = MixerTTSModel.from_pretrained("tts_en_lj_mixerttsx")
7
+ # model1 = HifiGanModel.from_pretrained(model_name="tts_en_lj_hifigan_ft_mixerttsx")
8
 
9
  spec_generator = FastPitchModel.from_pretrained("tts_en_fastpitch_multispeaker")
10
+ voc_model = HifiGanModel.from_pretrained(model_name="tts_en_hifitts_hifigan_ft_fastpitch")
11
 
12
  def greet(name):
13
  return "Hello " + name + "!!"
 
16
  sr = 22050
17
  parsed = spec_generator.parse(text)
18
  spectrogram = spec_generator.generate_spectrogram(tokens=parsed, speaker=speaker)
19
+ audio = voc_model.convert_spectrogram_to_audio(spec=spectrogram)
20
  return sr, audio
21
 
22
  def run():
23
  demo = gr.Interface(
24
+ fn=generate_tts,
25
  inputs=["text",
26
  gr.Slider(0, 10, step=1)],
27
  outputs="audio",