Suprath committed on
Commit
8964b86
·
verified ·
1 Parent(s): 55c3ec1

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -8
app.py CHANGED
@@ -192,20 +192,14 @@ text_output = gr.Textbox()
192
  with demo:
193
  gr.Markdown('''
194
  <div>
195
- <h1 style='text-align: center'>Speech Recognition from Visual Lip Movement by Audio-Visual Hidden Unit BERT Model (AV-HuBERT)</h1>
196
- This space uses AV-HuBERT models from <a href='https://github.com/facebookresearch' target='_blank'><b>Meta Research</b></a> to recoginze the speech from Lip Movement
197
- <figure>
198
- <img src="https://huggingface.co/vumichien/AV-HuBERT/resolve/main/lipreading.gif" alt="Audio-Visual Speech Recognition">
199
- <figcaption> Speech Recognition from visual lip movement
200
- </figcaption>
201
- </figure>
202
  </div>
203
  ''')
204
  with gr.Row():
205
  gr.Markdown('''
206
  ### Reading Lip movement with youtube link using Avhubert
207
  ##### Step 1a. Download video from youtube (Note: the length of video should be less than 10 seconds if not it will be cut and the face should be stable for better result)
208
- ##### Step 1b. You also can upload video directly
209
  ##### Step 2. Generating landmarks surrounding mouth area
210
  ##### Step 3. Reading lip movement.
211
  ''')
 
192
  with demo:
193
  gr.Markdown('''
194
  <div>
195
+ <h1 style='text-align: center'>Lip Reading Using Machine learning (Audio-Visual Hidden Unit BERT Model (AV-HuBERT))</h1>
 
 
 
 
 
 
196
  </div>
197
  ''')
198
  with gr.Row():
199
  gr.Markdown('''
200
  ### Reading Lip movement with youtube link using Avhubert
201
  ##### Step 1a. Download video from youtube (Note: the length of video should be less than 10 seconds if not it will be cut and the face should be stable for better result)
202
+ ##### Step 1b. Drag and drop videos to upload directly
203
  ##### Step 2. Generating landmarks surrounding mouth area
204
  ##### Step 3. Reading lip movement.
205
  ''')