Spaces:
Runtime error
Runtime error
Update app.py
Browse files
app.py
CHANGED
@@ -38,7 +38,8 @@ def predict(text, preset):
|
|
38 |
input_ids = inputs["input_ids"]
|
39 |
input_ids = input_ids[..., :model.config.max_text_positions]
|
40 |
|
41 |
-
|
|
|
42 |
speaker_embedding = torch.tensor(speaker_embedding).unsqueeze(0)
|
43 |
speech = model.generate_speech(input_ids, speaker_embedding, vocoder=vocoder)
|
44 |
|
@@ -46,11 +47,10 @@ def predict(text, preset):
|
|
46 |
return (16000, speech)
|
47 |
|
48 |
|
49 |
-
title = "
|
50 |
|
51 |
description = """
|
52 |
-
|
53 |
-
By pre-training on text and speech at the same time, it learns unified representations for both, resulting in improved modeling capabilities.
|
54 |
"""
|
55 |
|
56 |
article = """
|
|
|
38 |
input_ids = inputs["input_ids"]
|
39 |
input_ids = input_ids[..., :model.config.max_text_positions]
|
40 |
|
41 |
+
# cmu_us_awb_arctic-wav-arctic_a0002.npy
|
42 |
+
speaker_embedding = np.load('spkemb/cmu_us_bdl_arctic-wav-arctic_a0009.npy', allow_pickle=True)
|
43 |
speaker_embedding = torch.tensor(speaker_embedding).unsqueeze(0)
|
44 |
speech = model.generate_speech(input_ids, speaker_embedding, vocoder=vocoder)
|
45 |
|
|
|
47 |
return (16000, speech)
|
48 |
|
49 |
|
50 |
+
title = "Create 423: News to Speech"
|
51 |
|
52 |
description = """
|
53 |
+
Create 423: News to Speech
|
|
|
54 |
"""
|
55 |
|
56 |
article = """
|