kennethli319 committed on
Commit
09e6eb0
·
1 Parent(s): 462cad0

update tts

Browse files
Files changed (1) hide show
  1. app.py +5 -5
app.py CHANGED
@@ -25,18 +25,18 @@ def generate_tts(text: str, speaker: int = 0):
25
  spectrogram = spec_generator.generate_spectrogram(tokens=parsed, speaker=speaker)
26
  audio = voc_model.convert_spectrogram_to_audio(spec=spectrogram)
27
 
28
- with tempfile.NamedTemporaryFile(suffix=".wav", delete=False) as fp:
29
- torchaudio.save(fp.name, audio.to('cpu'), sample_rate=sr)
30
 
31
- return fp.name
32
- #return (sr, audio.to('cpu').detach().numpy())
33
 
34
  def run():
35
  demo = gr.Interface(
36
  fn=generate_tts,
37
  inputs=[gr.Textbox(value="This is a test.", label="Text to Synthesize"),
38
  gr.Slider(0, 10, step=1, label="Speaker")],
39
- outputs=gr.Audio(label="Output", type="filepath"),
40
  )
41
 
42
  demo.launch(server_name="0.0.0.0", server_port=7860)
 
25
  spectrogram = spec_generator.generate_spectrogram(tokens=parsed, speaker=speaker)
26
  audio = voc_model.convert_spectrogram_to_audio(spec=spectrogram)
27
 
28
+ # with tempfile.NamedTemporaryFile(suffix=".wav", delete=False) as fp:
29
+ # torchaudio.save(fp.name, audio.to('cpu'), sample_rate=sr)
30
 
31
+ # return fp.name
32
+ return (sr, audio.to('cpu').detach().numpy())
33
 
34
  def run():
35
  demo = gr.Interface(
36
  fn=generate_tts,
37
  inputs=[gr.Textbox(value="This is a test.", label="Text to Synthesize"),
38
  gr.Slider(0, 10, step=1, label="Speaker")],
39
+ outputs=gr.Audio(label="Output", type="numpy"),
40
  )
41
 
42
  demo.launch(server_name="0.0.0.0", server_port=7860)