trysem camenduru committed on
Commit
858cafb
·
0 Parent(s):

Duplicate from camenduru/one-shot-talking-face

Browse files

Co-authored-by: camenduru <[email protected]>

.gitattributes ADDED
@@ -0,0 +1,36 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ *.7z filter=lfs diff=lfs merge=lfs -text
2
+ *.arrow filter=lfs diff=lfs merge=lfs -text
3
+ *.bin filter=lfs diff=lfs merge=lfs -text
4
+ *.bz2 filter=lfs diff=lfs merge=lfs -text
5
+ *.ckpt filter=lfs diff=lfs merge=lfs -text
6
+ *.ftz filter=lfs diff=lfs merge=lfs -text
7
+ *.gz filter=lfs diff=lfs merge=lfs -text
8
+ *.h5 filter=lfs diff=lfs merge=lfs -text
9
+ *.joblib filter=lfs diff=lfs merge=lfs -text
10
+ *.lfs.* filter=lfs diff=lfs merge=lfs -text
11
+ *.mlmodel filter=lfs diff=lfs merge=lfs -text
12
+ *.model filter=lfs diff=lfs merge=lfs -text
13
+ *.msgpack filter=lfs diff=lfs merge=lfs -text
14
+ *.npy filter=lfs diff=lfs merge=lfs -text
15
+ *.npz filter=lfs diff=lfs merge=lfs -text
16
+ *.onnx filter=lfs diff=lfs merge=lfs -text
17
+ *.ot filter=lfs diff=lfs merge=lfs -text
18
+ *.parquet filter=lfs diff=lfs merge=lfs -text
19
+ *.pb filter=lfs diff=lfs merge=lfs -text
20
+ *.pickle filter=lfs diff=lfs merge=lfs -text
21
+ *.pkl filter=lfs diff=lfs merge=lfs -text
22
+ *.pt filter=lfs diff=lfs merge=lfs -text
23
+ *.pth filter=lfs diff=lfs merge=lfs -text
24
+ *.rar filter=lfs diff=lfs merge=lfs -text
25
+ *.safetensors filter=lfs diff=lfs merge=lfs -text
26
+ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
27
+ *.tar.* filter=lfs diff=lfs merge=lfs -text
28
+ *.tflite filter=lfs diff=lfs merge=lfs -text
29
+ *.tgz filter=lfs diff=lfs merge=lfs -text
30
+ *.wasm filter=lfs diff=lfs merge=lfs -text
31
+ *.xz filter=lfs diff=lfs merge=lfs -text
32
+ *.zip filter=lfs diff=lfs merge=lfs -text
33
+ *.zst filter=lfs diff=lfs merge=lfs -text
34
+ *tfevents* filter=lfs diff=lfs merge=lfs -text
35
+ examples/obama2.wav filter=lfs diff=lfs merge=lfs -text
36
+ examples/trump.wav filter=lfs diff=lfs merge=lfs -text
Dockerfile ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
# Base image definition, for reference:
# https://gitlab.com/nvidia/container-images/cuda/-/blob/master/dist/11.2.1/ubuntu2004/devel/cudnn8/Dockerfile
FROM nvidia/cuda:11.2.1-cudnn8-devel-ubuntu20.04
ENV DEBIAN_FRONTEND=noninteractive

WORKDIR /content

# `apt-get update` and every `apt-get install` live in ONE layer: if the
# update sits in its own cached layer, later install layers can be rebuilt
# against a stale package index and fail with 404s.
RUN apt-get update -y && apt-get upgrade -y && \
    apt-get install -y \
        sudo python3-pip \
        gnupg wget htop git git-lfs software-properties-common build-essential cmake curl \
        ffmpeg libavcodec-dev libavformat-dev libavdevice-dev libgl1 libgtk2.0-0 jq \
        libdc1394-22-dev libraw1394-dev libopenblas-base && \
    pip3 install --upgrade pip

# User-level pip scripts of the runtime user (created further down).
ENV PATH="/home/admin/.local/bin:${PATH}"

# gradio is held below 4.x because app.py relies on gr.Box and
# Row().style(...), both of which were removed in Gradio 4.
RUN pip3 install pandas scipy matplotlib torch torchvision torchaudio "gradio<4" altair imageio-ffmpeg pocketsphinx jq "numpy<1.24"

RUN git lfs install
RUN git clone https://huggingface.co/camenduru/pocketsphinx-20.04-t4 pocketsphinx && cd pocketsphinx && cmake --build build --target install

RUN git clone https://huggingface.co/camenduru/one-shot-talking-face-20.04-t4 one-shot-talking-face && cd one-shot-talking-face && pip3 install -r requirements.txt && chmod 755 OpenFace/FeatureExtraction
RUN mkdir /content/out

COPY app.py /content/app.py
COPY examples /content/examples

# Unprivileged runtime user with password-less sudo.
RUN adduser --disabled-password --gecos '' admin && \
    adduser admin sudo && \
    echo '%sudo ALL=(ALL) NOPASSWD:ALL' >> /etc/sudoers

# One layer instead of four: each recursive chown/chmod layer stores another
# copy of every file it touches, including the cloned repositories.
RUN chown -R admin:admin /content /home && chmod -R 777 /content /home
USER admin

EXPOSE 7860

CMD ["python3", "app.py"]
README.md ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ title: One Shot Talking Face
3
+ emoji: 🌞
4
+ colorFrom: blue
5
+ colorTo: blue
6
+ sdk: docker
7
+ sdk_version: 3.9
8
+ app_file: oh-no.py
9
+ pinned: false
10
+ duplicated_from: camenduru/one-shot-talking-face
11
+ ---
app.py ADDED
@@ -0,0 +1,66 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import gradio as gr
2
+ import os, subprocess, torchaudio
3
+ import torch
4
+ from PIL import Image
5
+
6
+ block = gr.Blocks()
7
+
8
def pad_image(image):
    """Pad a PIL image with black borders so that it becomes square.

    The picture is centred along its shorter axis on a canvas whose side
    equals the longer dimension. An image that is already square is returned
    as-is (the same object, not a copy).

    Args:
        image: A ``PIL.Image.Image``.

    Returns:
        ``image`` itself when it is square, otherwise a new square image in
        the same mode.
    """
    w, h = image.size
    if w == h:
        return image

    # Function-scope import: keeps this block independent of the file's
    # top-level import list.
    from PIL import ImageColor

    side = max(w, h)
    # A literal (0, 0, 0) fill is rejected for single- and two-band modes
    # such as "L" or "LA"; getcolor yields the "black" value that matches the
    # image's own mode (and the same opaque black as before for RGB/RGBA).
    black = ImageColor.getcolor("black", image.mode)
    new_image = Image.new(image.mode, (side, side), black)
    # One of the two offsets is always 0, which reproduces the separate
    # wide/tall branches of the previous implementation.
    new_image.paste(image, ((side - w) // 2, (side - h) // 2))
    return new_image
20
+
21
# jq program that reshapes the pocketsphinx alignment JSON into a list of
# {word, phones: [{ph, bg, ed}]} objects:
#   * word: upper-cased `.t`; "<S>"/"<SIL>" become "sil", the "(2)"/"(3)"/"(4)"
#     suffixes are dropped, "[SPEECH]"/"[NOISE]" become "SIL";
#   * ph: `.t` with "+SPN+"/"+NSN+" replaced by "SIL";
#   * bg/ed: floor(b*100) and floor(b*100 + d*100).
# Raw strings avoid the invalid "\(", "\[" and "\+" escape sequences while
# producing exactly the same program text.
_JQ_FILTER = (
    r'[.w[]|{word: (.t | ascii_upcase'
    r' | sub("<S>"; "sil") | sub("<SIL>"; "sil")'
    r' | sub("\\(2\\)"; "") | sub("\\(3\\)"; "") | sub("\\(4\\)"; "")'
    r' | sub("\\[SPEECH\\]"; "SIL") | sub("\\[NOISE\\]"; "SIL")), '
    r'phones: [.w[]|{ph: .t | sub("\\+SPN\\+"; "SIL") | sub("\\+NSN\\+"; "SIL"), '
    r'bg: (.b*100)|floor, ed: (.b*100+.d*100)|floor}]}]'
)


def calculate(image_in, audio_in):
    """Generate a talking-face video from one image and one audio clip.

    Steps: write the audio as 16-bit PCM after averaging over dim 0, save the
    image squared via ``pad_image``, phone-align the audio with pocketsphinx,
    reshape the alignment with jq, then run the one-shot-talking-face
    ``test_script.py`` on the three files.

    Args:
        image_in: Path of the input image file.
        audio_in: Path of the input audio file.

    Returns:
        The path ``/content/train/image_audio.mp4``.

    Raises:
        subprocess.CalledProcessError: If pocketsphinx, jq or the generation
            script exits with a non-zero status.
    """
    # Every intermediate file uses an absolute path: the generation script is
    # handed /content/... paths, so writing relative to the current working
    # directory only worked when that directory happened to be /content.
    audio_path = "/content/audio.wav"
    image_path = "/content/image.png"
    phoneme_path = "/content/test.json"

    waveform, sample_rate = torchaudio.load(audio_in)
    # Presumably dim 0 is the channel axis, making this a mono down-mix.
    waveform = torch.mean(waveform, dim=0, keepdim=True)
    torchaudio.save(audio_path, waveform, sample_rate, encoding="PCM_S", bits_per_sample=16)

    # Context manager closes the source file handle once the copy is saved.
    with Image.open(image_in) as image:
        pad_image(image).save(image_path)

    pocketsphinx_run = subprocess.run(
        ['pocketsphinx', '-phone_align', 'yes', 'single', audio_path],
        check=True,
        capture_output=True,
    )
    # check=True: a failing jq used to go unnoticed and left an empty JSON file.
    jq_run = subprocess.run(
        ['jq', _JQ_FILTER],
        input=pocketsphinx_run.stdout,
        check=True,
        capture_output=True,
    )
    with open(phoneme_path, "w", encoding="utf-8") as f:
        f.write(jq_run.stdout.decode('utf-8').strip())

    # Argument list + cwd instead of a shell string; check=True surfaces a
    # failed generation instead of returning a stale or missing video.
    subprocess.run(
        [
            "python3", "-B", "test_script.py",
            "--img_path", image_path,
            "--audio_path", audio_path,
            "--phoneme_path", phoneme_path,
            "--save_dir", "/content/train",
        ],
        cwd="/content/one-shot-talking-face",
        check=True,
    )
    return "/content/train/image_audio.mp4"
36
+
37
def run():
    """Lay out the Gradio page on the module-level ``block`` and serve it.

    The page has a links banner, an image input, an audio input and a video
    output in one row, a "Generate" button, and five cached example pairs.
    Both the button and the examples call ``calculate``.
    """
    sample_pairs = [
        ["./examples/monalisa.jpg", "./examples/obama2.wav"],
        ["./examples/monalisa.jpg", "./examples/trump.wav"],
        ["./examples/o2.jpg", "./examples/obama2.wav"],
        ["./examples/o2.jpg", "./examples/trump.wav"],
        ["./examples/image.png", "./examples/audio.wav"],
    ]

    with block:
        gr.Markdown(
            """
<style> body { text-align: right} </style>
map: 📄 [arxiv](https://arxiv.org/abs/2112.02749) &nbsp; ⇨ 👩‍💻 [github](https://github.com/FuxiVirtualHuman/AAAI22-one-shot-talking-face) &nbsp; ⇨ 🦒 [colab](https://github.com/camenduru/one-shot-talking-face-colab) &nbsp; ⇨ 🤗 [huggingface](https://huggingface.co/spaces/camenduru/one-shot-talking-face) &nbsp; | &nbsp; tools: 🌀 [duplicate this space](https://huggingface.co/spaces/camenduru/sandbox?duplicate=true) &nbsp; | 🐢 [tortoise tts](https://huggingface.co/spaces/mdnestor/tortoise) &nbsp; | 🎨 [text-to-image](https://huggingface.co/models?pipeline_tag=text-to-image&sort=downloads) &nbsp; | 🐣 [twitter](https://twitter.com/camenduru) &nbsp;
""")
        with gr.Group(), gr.Box():
            # Inputs and the result share one row.
            with gr.Row().style(equal_height=True):
                picture = gr.Image(show_label=False, type="filepath")
                speech = gr.Audio(show_label=False, type='filepath')
                result = gr.Video(show_label=False)
            with gr.Row().style(equal_height=True):
                generate = gr.Button("Generate")

        gr.Examples(
            examples=sample_pairs,
            fn=calculate,
            inputs=[picture, speech],
            outputs=[result],
            cache_examples=True,
        )

        generate.click(calculate, inputs=[picture, speech], outputs=[result])

    # Serve on all interfaces, on the port the Dockerfile exposes.
    block.queue()
    block.launch(server_name="0.0.0.0", server_port=7860)


if __name__ == "__main__":
    run()
audio.wav ADDED
Binary file (608 kB). View file
 
examples/audio.wav ADDED
Binary file (608 kB). View file
 
examples/image.png ADDED
examples/monalisa.jpg ADDED
examples/o2.jpg ADDED
examples/obama2.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d59c8e469bda05ae7a7435420322c8a192b75ab44e7dc694a81b81512a36542
3
+ size 1280078
examples/trump.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb718f7537230f1c8a24fae2ec28eb56381f20ce25140d0b16a4dd1873de5a86
3
+ size 1856140
image.png ADDED
oh-no.py ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
import gradio as gr

# Shared Blocks container that run() fills and serves.
block = gr.Blocks()

# Static notice shown in place of the real application.
_OUTAGE_NOTICE = """
<p>oh no 😐 something wrong with the 🤗 hugging face servers 😐 hopefully, it will be fixed soon</p>
"""


def run():
    """Serve a single-paragraph outage notice on 0.0.0.0:7860."""
    with block:
        gr.Markdown(_OUTAGE_NOTICE)
    block.launch(server_name="0.0.0.0", server_port=7860)


if __name__ == "__main__":
    run()
test.json ADDED
@@ -0,0 +1,977 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "word": "sil",
4
+ "phones": [
5
+ {
6
+ "ph": "SIL",
7
+ "bg": 0,
8
+ "ed": 18
9
+ }
10
+ ]
11
+ },
12
+ {
13
+ "word": "I",
14
+ "phones": [
15
+ {
16
+ "ph": "AY",
17
+ "bg": 18,
18
+ "ed": 21
19
+ }
20
+ ]
21
+ },
22
+ {
23
+ "word": "WANT",
24
+ "phones": [
25
+ {
26
+ "ph": "W",
27
+ "bg": 21,
28
+ "ed": 33
29
+ },
30
+ {
31
+ "ph": "AO",
32
+ "bg": 33,
33
+ "ed": 48
34
+ },
35
+ {
36
+ "ph": "N",
37
+ "bg": 48,
38
+ "ed": 60
39
+ },
40
+ {
41
+ "ph": "T",
42
+ "bg": 60,
43
+ "ed": 65
44
+ }
45
+ ]
46
+ },
47
+ {
48
+ "word": "TO",
49
+ "phones": [
50
+ {
51
+ "ph": "T",
52
+ "bg": 65,
53
+ "ed": 74
54
+ },
55
+ {
56
+ "ph": "UW",
57
+ "bg": 74,
58
+ "ed": 80
59
+ }
60
+ ]
61
+ },
62
+ {
63
+ "word": "LOSE",
64
+ "phones": [
65
+ {
66
+ "ph": "L",
67
+ "bg": 80,
68
+ "ed": 87
69
+ },
70
+ {
71
+ "ph": "UW",
72
+ "bg": 87,
73
+ "ed": 121
74
+ },
75
+ {
76
+ "ph": "Z",
77
+ "bg": 121,
78
+ "ed": 150
79
+ }
80
+ ]
81
+ },
82
+ {
83
+ "word": "SIL",
84
+ "phones": [
85
+ {
86
+ "ph": "SIL",
87
+ "bg": 150,
88
+ "ed": 158
89
+ }
90
+ ]
91
+ },
92
+ {
93
+ "word": "sil",
94
+ "phones": [
95
+ {
96
+ "ph": "SIL",
97
+ "bg": 158,
98
+ "ed": 250
99
+ }
100
+ ]
101
+ },
102
+ {
103
+ "word": "TO",
104
+ "phones": [
105
+ {
106
+ "ph": "T",
107
+ "bg": 250,
108
+ "ed": 255
109
+ },
110
+ {
111
+ "ph": "UW",
112
+ "bg": 254,
113
+ "ed": 276
114
+ }
115
+ ]
116
+ },
117
+ {
118
+ "word": "TO",
119
+ "phones": [
120
+ {
121
+ "ph": "T",
122
+ "bg": 276,
123
+ "ed": 302
124
+ },
125
+ {
126
+ "ph": "AH",
127
+ "bg": 302,
128
+ "ed": 328
129
+ }
130
+ ]
131
+ },
132
+ {
133
+ "word": "sil",
134
+ "phones": [
135
+ {
136
+ "ph": "SIL",
137
+ "bg": 328,
138
+ "ed": 337
139
+ }
140
+ ]
141
+ },
142
+ {
143
+ "word": "KEEP",
144
+ "phones": [
145
+ {
146
+ "ph": "K",
147
+ "bg": 337,
148
+ "ed": 364
149
+ },
150
+ {
151
+ "ph": "IY",
152
+ "bg": 364,
153
+ "ed": 367
154
+ },
155
+ {
156
+ "ph": "P",
157
+ "bg": 367,
158
+ "ed": 375
159
+ }
160
+ ]
161
+ },
162
+ {
163
+ "word": "YOU",
164
+ "phones": [
165
+ {
166
+ "ph": "Y",
167
+ "bg": 375,
168
+ "ed": 382
169
+ },
170
+ {
171
+ "ph": "UW",
172
+ "bg": 382,
173
+ "ed": 385
174
+ }
175
+ ]
176
+ },
177
+ {
178
+ "word": "sil",
179
+ "phones": [
180
+ {
181
+ "ph": "SIL",
182
+ "bg": 385,
183
+ "ed": 392
184
+ }
185
+ ]
186
+ },
187
+ {
188
+ "word": "sil",
189
+ "phones": [
190
+ {
191
+ "ph": "SIL",
192
+ "bg": 392,
193
+ "ed": 446
194
+ }
195
+ ]
196
+ },
197
+ {
198
+ "word": "sil",
199
+ "phones": [
200
+ {
201
+ "ph": "SIL",
202
+ "bg": 446,
203
+ "ed": 475
204
+ }
205
+ ]
206
+ },
207
+ {
208
+ "word": "TRUST",
209
+ "phones": [
210
+ {
211
+ "ph": "T",
212
+ "bg": 475,
213
+ "ed": 482
214
+ },
215
+ {
216
+ "ph": "R",
217
+ "bg": 482,
218
+ "ed": 491
219
+ },
220
+ {
221
+ "ph": "AH",
222
+ "bg": 491,
223
+ "ed": 495
224
+ },
225
+ {
226
+ "ph": "S",
227
+ "bg": 495,
228
+ "ed": 506
229
+ },
230
+ {
231
+ "ph": "T",
232
+ "bg": 505,
233
+ "ed": 516
234
+ }
235
+ ]
236
+ },
237
+ {
238
+ "word": "sil",
239
+ "phones": [
240
+ {
241
+ "ph": "SIL",
242
+ "bg": 516,
243
+ "ed": 523
244
+ }
245
+ ]
246
+ },
247
+ {
248
+ "word": "GROUP",
249
+ "phones": [
250
+ {
251
+ "ph": "G",
252
+ "bg": 523,
253
+ "ed": 529
254
+ },
255
+ {
256
+ "ph": "R",
257
+ "bg": 529,
258
+ "ed": 532
259
+ },
260
+ {
261
+ "ph": "UW",
262
+ "bg": 532,
263
+ "ed": 546
264
+ },
265
+ {
266
+ "ph": "P",
267
+ "bg": 546,
268
+ "ed": 553
269
+ }
270
+ ]
271
+ },
272
+ {
273
+ "word": "SCHWARTZ",
274
+ "phones": [
275
+ {
276
+ "ph": "SH",
277
+ "bg": 553,
278
+ "ed": 564
279
+ },
280
+ {
281
+ "ph": "W",
282
+ "bg": 564,
283
+ "ed": 583
284
+ },
285
+ {
286
+ "ph": "AO",
287
+ "bg": 583,
288
+ "ed": 624
289
+ },
290
+ {
291
+ "ph": "R",
292
+ "bg": 624,
293
+ "ed": 628
294
+ },
295
+ {
296
+ "ph": "T",
297
+ "bg": 628,
298
+ "ed": 636
299
+ },
300
+ {
301
+ "ph": "S",
302
+ "bg": 636,
303
+ "ed": 639
304
+ }
305
+ ]
306
+ },
307
+ {
308
+ "word": "YOU",
309
+ "phones": [
310
+ {
311
+ "ph": "Y",
312
+ "bg": 639,
313
+ "ed": 643
314
+ },
315
+ {
316
+ "ph": "UW",
317
+ "bg": 643,
318
+ "ed": 646
319
+ }
320
+ ]
321
+ },
322
+ {
323
+ "word": "GO",
324
+ "phones": [
325
+ {
326
+ "ph": "G",
327
+ "bg": 646,
328
+ "ed": 660
329
+ },
330
+ {
331
+ "ph": "OW",
332
+ "bg": 660,
333
+ "ed": 666
334
+ }
335
+ ]
336
+ },
337
+ {
338
+ "word": "ON",
339
+ "phones": [
340
+ {
341
+ "ph": "AO",
342
+ "bg": 666,
343
+ "ed": 719
344
+ },
345
+ {
346
+ "ph": "N",
347
+ "bg": 719,
348
+ "ed": 725
349
+ }
350
+ ]
351
+ },
352
+ {
353
+ "word": "AND",
354
+ "phones": [
355
+ {
356
+ "ph": "AH",
357
+ "bg": 725,
358
+ "ed": 728
359
+ },
360
+ {
361
+ "ph": "N",
362
+ "bg": 728,
363
+ "ed": 734
364
+ },
365
+ {
366
+ "ph": "D",
367
+ "bg": 734,
368
+ "ed": 753
369
+ }
370
+ ]
371
+ },
372
+ {
373
+ "word": "RUMORS",
374
+ "phones": [
375
+ {
376
+ "ph": "R",
377
+ "bg": 753,
378
+ "ed": 766
379
+ },
380
+ {
381
+ "ph": "UW",
382
+ "bg": 766,
383
+ "ed": 787
384
+ },
385
+ {
386
+ "ph": "M",
387
+ "bg": 787,
388
+ "ed": 793
389
+ },
390
+ {
391
+ "ph": "ER",
392
+ "bg": 793,
393
+ "ed": 797
394
+ },
395
+ {
396
+ "ph": "Z",
397
+ "bg": 797,
398
+ "ed": 809
399
+ }
400
+ ]
401
+ },
402
+ {
403
+ "word": "sil",
404
+ "phones": [
405
+ {
406
+ "ph": "SIL",
407
+ "bg": 809,
408
+ "ed": 820
409
+ }
410
+ ]
411
+ },
412
+ {
413
+ "word": "THAT",
414
+ "phones": [
415
+ {
416
+ "ph": "DH",
417
+ "bg": 819,
418
+ "ed": 824
419
+ },
420
+ {
421
+ "ph": "AH",
422
+ "bg": 825,
423
+ "ed": 841
424
+ },
425
+ {
426
+ "ph": "T",
427
+ "bg": 841,
428
+ "ed": 865
429
+ }
430
+ ]
431
+ },
432
+ {
433
+ "word": "WILL",
434
+ "phones": [
435
+ {
436
+ "ph": "W",
437
+ "bg": 865,
438
+ "ed": 870
439
+ },
440
+ {
441
+ "ph": "AH",
442
+ "bg": 869,
443
+ "ed": 872
444
+ },
445
+ {
446
+ "ph": "L",
447
+ "bg": 873,
448
+ "ed": 896
449
+ }
450
+ ]
451
+ },
452
+ {
453
+ "word": "sil",
454
+ "phones": [
455
+ {
456
+ "ph": "SIL",
457
+ "bg": 896,
458
+ "ed": 1018
459
+ }
460
+ ]
461
+ },
462
+ {
463
+ "word": "REDUCE",
464
+ "phones": [
465
+ {
466
+ "ph": "R",
467
+ "bg": 1018,
468
+ "ed": 1023
469
+ },
470
+ {
471
+ "ph": "AH",
472
+ "bg": 1023,
473
+ "ed": 1027
474
+ },
475
+ {
476
+ "ph": "D",
477
+ "bg": 1027,
478
+ "ed": 1031
479
+ },
480
+ {
481
+ "ph": "UW",
482
+ "bg": 1031,
483
+ "ed": 1043
484
+ },
485
+ {
486
+ "ph": "S",
487
+ "bg": 1043,
488
+ "ed": 1056
489
+ }
490
+ ]
491
+ },
492
+ {
493
+ "word": "THE",
494
+ "phones": [
495
+ {
496
+ "ph": "DH",
497
+ "bg": 1056,
498
+ "ed": 1079
499
+ },
500
+ {
501
+ "ph": "AH",
502
+ "bg": 1079,
503
+ "ed": 1084
504
+ }
505
+ ]
506
+ },
507
+ {
508
+ "word": "DO",
509
+ "phones": [
510
+ {
511
+ "ph": "D",
512
+ "bg": 1084,
513
+ "ed": 1087
514
+ },
515
+ {
516
+ "ph": "UW",
517
+ "bg": 1087,
518
+ "ed": 1100
519
+ }
520
+ ]
521
+ },
522
+ {
523
+ "word": "GET",
524
+ "phones": [
525
+ {
526
+ "ph": "G",
527
+ "bg": 1100,
528
+ "ed": 1106
529
+ },
530
+ {
531
+ "ph": "IH",
532
+ "bg": 1106,
533
+ "ed": 1112
534
+ },
535
+ {
536
+ "ph": "T",
537
+ "bg": 1112,
538
+ "ed": 1118
539
+ }
540
+ ]
541
+ },
542
+ {
543
+ "word": "THE",
544
+ "phones": [
545
+ {
546
+ "ph": "DH",
547
+ "bg": 1118,
548
+ "ed": 1126
549
+ },
550
+ {
551
+ "ph": "IY",
552
+ "bg": 1126,
553
+ "ed": 1130
554
+ }
555
+ ]
556
+ },
557
+ {
558
+ "word": "UNIONS",
559
+ "phones": [
560
+ {
561
+ "ph": "Y",
562
+ "bg": 1130,
563
+ "ed": 1135
564
+ },
565
+ {
566
+ "ph": "UW",
567
+ "bg": 1135,
568
+ "ed": 1150
569
+ },
570
+ {
571
+ "ph": "N",
572
+ "bg": 1150,
573
+ "ed": 1153
574
+ },
575
+ {
576
+ "ph": "Y",
577
+ "bg": 1153,
578
+ "ed": 1164
579
+ },
580
+ {
581
+ "ph": "AH",
582
+ "bg": 1164,
583
+ "ed": 1169
584
+ },
585
+ {
586
+ "ph": "N",
587
+ "bg": 1169,
588
+ "ed": 1175
589
+ },
590
+ {
591
+ "ph": "Z",
592
+ "bg": 1175,
593
+ "ed": 1205
594
+ }
595
+ ]
596
+ },
597
+ {
598
+ "word": "YOUR",
599
+ "phones": [
600
+ {
601
+ "ph": "Y",
602
+ "bg": 1205,
603
+ "ed": 1208
604
+ },
605
+ {
606
+ "ph": "UH",
607
+ "bg": 1208,
608
+ "ed": 1212
609
+ },
610
+ {
611
+ "ph": "R",
612
+ "bg": 1212,
613
+ "ed": 1215
614
+ }
615
+ ]
616
+ },
617
+ {
618
+ "word": "OWN",
619
+ "phones": [
620
+ {
621
+ "ph": "OW",
622
+ "bg": 1215,
623
+ "ed": 1251
624
+ },
625
+ {
626
+ "ph": "N",
627
+ "bg": 1251,
628
+ "ed": 1259
629
+ }
630
+ ]
631
+ },
632
+ {
633
+ "word": "COLOR",
634
+ "phones": [
635
+ {
636
+ "ph": "K",
637
+ "bg": 1259,
638
+ "ed": 1288
639
+ },
640
+ {
641
+ "ph": "AH",
642
+ "bg": 1288,
643
+ "ed": 1291
644
+ },
645
+ {
646
+ "ph": "L",
647
+ "bg": 1291,
648
+ "ed": 1301
649
+ },
650
+ {
651
+ "ph": "ER",
652
+ "bg": 1301,
653
+ "ed": 1311
654
+ }
655
+ ]
656
+ },
657
+ {
658
+ "word": "OR",
659
+ "phones": [
660
+ {
661
+ "ph": "AO",
662
+ "bg": 1311,
663
+ "ed": 1328
664
+ },
665
+ {
666
+ "ph": "R",
667
+ "bg": 1328,
668
+ "ed": 1332
669
+ }
670
+ ]
671
+ },
672
+ {
673
+ "word": "sil",
674
+ "phones": [
675
+ {
676
+ "ph": "SIL",
677
+ "bg": 1332,
678
+ "ed": 1335
679
+ }
680
+ ]
681
+ },
682
+ {
683
+ "word": "WHAT",
684
+ "phones": [
685
+ {
686
+ "ph": "HH",
687
+ "bg": 1335,
688
+ "ed": 1349
689
+ },
690
+ {
691
+ "ph": "W",
692
+ "bg": 1349,
693
+ "ed": 1361
694
+ },
695
+ {
696
+ "ph": "AH",
697
+ "bg": 1361,
698
+ "ed": 1364
699
+ },
700
+ {
701
+ "ph": "T",
702
+ "bg": 1364,
703
+ "ed": 1379
704
+ }
705
+ ]
706
+ },
707
+ {
708
+ "word": "WHAT",
709
+ "phones": [
710
+ {
711
+ "ph": "HH",
712
+ "bg": 1379,
713
+ "ed": 1387
714
+ },
715
+ {
716
+ "ph": "W",
717
+ "bg": 1387,
718
+ "ed": 1390
719
+ },
720
+ {
721
+ "ph": "AH",
722
+ "bg": 1390,
723
+ "ed": 1394
724
+ },
725
+ {
726
+ "ph": "T",
727
+ "bg": 1394,
728
+ "ed": 1403
729
+ }
730
+ ]
731
+ },
732
+ {
733
+ "word": "A",
734
+ "phones": [
735
+ {
736
+ "ph": "EY",
737
+ "bg": 1403,
738
+ "ed": 1421
739
+ }
740
+ ]
741
+ },
742
+ {
743
+ "word": "SIL",
744
+ "phones": [
745
+ {
746
+ "ph": "SIL",
747
+ "bg": 1421,
748
+ "ed": 1432
749
+ }
750
+ ]
751
+ },
752
+ {
753
+ "word": "BOON",
754
+ "phones": [
755
+ {
756
+ "ph": "B",
757
+ "bg": 1432,
758
+ "ed": 1436
759
+ },
760
+ {
761
+ "ph": "UW",
762
+ "bg": 1436,
763
+ "ed": 1446
764
+ },
765
+ {
766
+ "ph": "N",
767
+ "bg": 1446,
768
+ "ed": 1471
769
+ }
770
+ ]
771
+ },
772
+ {
773
+ "word": "sil",
774
+ "phones": [
775
+ {
776
+ "ph": "SIL",
777
+ "bg": 1471,
778
+ "ed": 1511
779
+ }
780
+ ]
781
+ },
782
+ {
783
+ "word": "FOR",
784
+ "phones": [
785
+ {
786
+ "ph": "F",
787
+ "bg": 1511,
788
+ "ed": 1519
789
+ },
790
+ {
791
+ "ph": "R",
792
+ "bg": 1519,
793
+ "ed": 1526
794
+ },
795
+ {
796
+ "ph": "ER",
797
+ "bg": 1526,
798
+ "ed": 1529
799
+ }
800
+ ]
801
+ },
802
+ {
803
+ "word": "LUNCH",
804
+ "phones": [
805
+ {
806
+ "ph": "L",
807
+ "bg": 1529,
808
+ "ed": 1537
809
+ },
810
+ {
811
+ "ph": "AH",
812
+ "bg": 1537,
813
+ "ed": 1541
814
+ },
815
+ {
816
+ "ph": "N",
817
+ "bg": 1541,
818
+ "ed": 1547
819
+ },
820
+ {
821
+ "ph": "CH",
822
+ "bg": 1547,
823
+ "ed": 1570
824
+ }
825
+ ]
826
+ },
827
+ {
828
+ "word": "sil",
829
+ "phones": [
830
+ {
831
+ "ph": "SIL",
832
+ "bg": 1570,
833
+ "ed": 1574
834
+ }
835
+ ]
836
+ },
837
+ {
838
+ "word": "THEY",
839
+ "phones": [
840
+ {
841
+ "ph": "DH",
842
+ "bg": 1574,
843
+ "ed": 1584
844
+ },
845
+ {
846
+ "ph": "EY",
847
+ "bg": 1584,
848
+ "ed": 1610
849
+ }
850
+ ]
851
+ },
852
+ {
853
+ "word": "ISSUE",
854
+ "phones": [
855
+ {
856
+ "ph": "IH",
857
+ "bg": 1610,
858
+ "ed": 1616
859
+ },
860
+ {
861
+ "ph": "SH",
862
+ "bg": 1616,
863
+ "ed": 1641
864
+ },
865
+ {
866
+ "ph": "UW",
867
+ "bg": 1641,
868
+ "ed": 1680
869
+ }
870
+ ]
871
+ },
872
+ {
873
+ "word": "sil",
874
+ "phones": [
875
+ {
876
+ "ph": "SIL",
877
+ "bg": 1680,
878
+ "ed": 1688
879
+ }
880
+ ]
881
+ },
882
+ {
883
+ "word": "IS",
884
+ "phones": [
885
+ {
886
+ "ph": "IH",
887
+ "bg": 1688,
888
+ "ed": 1695
889
+ },
890
+ {
891
+ "ph": "Z",
892
+ "bg": 1695,
893
+ "ed": 1715
894
+ }
895
+ ]
896
+ },
897
+ {
898
+ "word": "NOT",
899
+ "phones": [
900
+ {
901
+ "ph": "N",
902
+ "bg": 1714,
903
+ "ed": 1725
904
+ },
905
+ {
906
+ "ph": "AA",
907
+ "bg": 1726,
908
+ "ed": 1737
909
+ },
910
+ {
911
+ "ph": "T",
912
+ "bg": 1737,
913
+ "ed": 1740
914
+ }
915
+ ]
916
+ },
917
+ {
918
+ "word": "SURE",
919
+ "phones": [
920
+ {
921
+ "ph": "SH",
922
+ "bg": 1739,
923
+ "ed": 1764
924
+ },
925
+ {
926
+ "ph": "UH",
927
+ "bg": 1764,
928
+ "ed": 1773
929
+ },
930
+ {
931
+ "ph": "R",
932
+ "bg": 1773,
933
+ "ed": 1778
934
+ }
935
+ ]
936
+ },
937
+ {
938
+ "word": "WHAT",
939
+ "phones": [
940
+ {
941
+ "ph": "W",
942
+ "bg": 1779,
943
+ "ed": 1782
944
+ },
945
+ {
946
+ "ph": "AH",
947
+ "bg": 1782,
948
+ "ed": 1786
949
+ },
950
+ {
951
+ "ph": "T",
952
+ "bg": 1786,
953
+ "ed": 1828
954
+ }
955
+ ]
956
+ },
957
+ {
958
+ "word": "sil",
959
+ "phones": [
960
+ {
961
+ "ph": "SIL",
962
+ "bg": 1828,
963
+ "ed": 1846
964
+ }
965
+ ]
966
+ },
967
+ {
968
+ "word": "</S>",
969
+ "phones": [
970
+ {
971
+ "ph": "SIL",
972
+ "bg": 1846,
973
+ "ed": 1900
974
+ }
975
+ ]
976
+ }
977
+ ]