Update app.py
Browse files
app.py
CHANGED
|
@@ -192,20 +192,14 @@ text_output = gr.Textbox()
|
|
| 192 |
with demo:
|
| 193 |
gr.Markdown('''
|
| 194 |
<div>
|
| 195 |
-
<h1 style='text-align: center'>
|
| 196 |
-
This space uses AV-HuBERT models from <a href='https://github.com/facebookresearch' target='_blank'><b>Meta Research</b></a> to recognize speech from lip movement
|
| 197 |
-
<figure>
|
| 198 |
-
<img src="https://huggingface.co/vumichien/AV-HuBERT/resolve/main/lipreading.gif" alt="Audio-Visual Speech Recognition">
|
| 199 |
-
<figcaption> Speech Recognition from visual lip movement
|
| 200 |
-
</figcaption>
|
| 201 |
-
</figure>
|
| 202 |
</div>
|
| 203 |
''')
|
| 204 |
with gr.Row():
|
| 205 |
gr.Markdown('''
|
| 206 |
### Reading Lip movement with youtube link using Avhubert
|
| 207 |
##### Step 1a. Download video from youtube (Note: the length of video should be less than 10 seconds if not it will be cut and the face should be stable for better result)
|
| 208 |
-
##### Step 1b.
|
| 209 |
##### Step 2. Generating landmarks surrounding mouth area
|
| 210 |
##### Step 3. Reading lip movement.
|
| 211 |
''')
|
|
|
|
| 192 |
with demo:
|
| 193 |
gr.Markdown('''
|
| 194 |
<div>
|
| 195 |
+
<h1 style='text-align: center'>Lip Reading Using Machine Learning (Audio-Visual Hidden Unit BERT Model (AV-HuBERT))</h1>
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 196 |
</div>
|
| 197 |
''')
|
| 198 |
with gr.Row():
|
| 199 |
gr.Markdown('''
|
| 200 |
### Reading Lip movement with youtube link using Avhubert
|
| 201 |
##### Step 1a. Download video from youtube (Note: the length of video should be less than 10 seconds if not it will be cut and the face should be stable for better result)
|
| 202 |
+
##### Step 1b. Drag and drop videos to upload directly
|
| 203 |
##### Step 2. Generating landmarks surrounding mouth area
|
| 204 |
##### Step 3. Reading lip movement.
|
| 205 |
''')
|