demo
Browse files
app.py
CHANGED
@@ -21,33 +21,9 @@ def predict(text, speaker):
|
|
21 |
if len(text.strip()) == 0:
|
22 |
return (16000, np.zeros(0).astype(np.int16))
|
23 |
|
24 |
-
|
25 |
-
input_ids = inputs["input_ids"]
|
26 |
-
input_ids = input_ids[..., :model.config.max_text_positions]
|
27 |
-
|
28 |
-
if speaker == "Surprise Me!":
|
29 |
-
# load one of the provided speaker embeddings at random
|
30 |
-
idx = np.random.randint(len(speaker_embeddings))
|
31 |
-
key = list(speaker_embeddings.keys())[idx]
|
32 |
-
speaker_embedding = np.load(speaker_embeddings[key])
|
33 |
-
|
34 |
-
# randomly shuffle the elements
|
35 |
-
np.random.shuffle(speaker_embedding)
|
36 |
-
|
37 |
-
# randomly flip half the values
|
38 |
-
x = (np.random.rand(512) >= 0.5) * 1.0
|
39 |
-
x[x == 0] = -1.0
|
40 |
-
speaker_embedding *= x
|
41 |
-
|
42 |
-
#speaker_embedding = np.random.rand(512).astype(np.float32) * 0.3 - 0.15
|
43 |
-
else:
|
44 |
-
speaker_embedding = np.load(speaker_embeddings[speaker[:3]])
|
45 |
-
|
46 |
speaker_embedding = torch.tensor(speaker_embedding).unsqueeze(0)
|
47 |
-
|
48 |
-
|
49 |
speech = synthesiser(text, forward_params={"speaker_embeddings": speaker_embedding})
|
50 |
-
|
51 |
speech = (speech.numpy() * 32767).astype(np.int16)
|
52 |
return (16000, speech)
|
53 |
|
@@ -72,7 +48,6 @@ gr.Interface(
|
|
72 |
"GGP (gwryw-gogledd-pro)",
|
73 |
"BGP (benyw-gogledd-pro)",
|
74 |
"BDP (benyw-de-pro)",
|
75 |
-
"Surprise Me!"
|
76 |
],
|
77 |
value="GGP (gwryw-gogledd-pro)"),
|
78 |
],
|
|
|
21 |
if len(text.strip()) == 0:
|
22 |
return (16000, np.zeros(0).astype(np.int16))
|
23 |
|
24 |
+
speaker_embedding = np.load(speaker_embeddings[speaker[:3]])
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
25 |
speaker_embedding = torch.tensor(speaker_embedding).unsqueeze(0)
|
|
|
|
|
26 |
speech = synthesiser(text, forward_params={"speaker_embeddings": speaker_embedding})
|
|
|
27 |
speech = (speech.numpy() * 32767).astype(np.int16)
|
28 |
return (16000, speech)
|
29 |
|
|
|
48 |
"GGP (gwryw-gogledd-pro)",
|
49 |
"BGP (benyw-gogledd-pro)",
|
50 |
"BDP (benyw-de-pro)",
|
|
|
51 |
],
|
52 |
value="GGP (gwryw-gogledd-pro)"),
|
53 |
],
|