arunasrivastava committed on
Commit
a5a6781
·
1 Parent(s): 3a023fb

without eval library

Browse files
Files changed (4) hide show
  1. app.py +2 -2
  2. queue/leaderboard.json +10 -0
  3. queue/results.json +46 -0
  4. queue/tasks.json +1 -1
app.py CHANGED
@@ -36,7 +36,7 @@ def format_leaderboard_df(df):
36
  "Model": df["model"],
37
  "Average PER ⬇️": df["average_per"].apply(lambda x: f"{x:.4f}"),
38
  "Average PWED ⬇️": df["average_pwed"].apply(lambda x: f"{x:.4f}"),
39
- "GitHub": df["github_url"].apply(lambda x: f'<a href="{x}" target="_blank">Repository</a>' if x else "N/A"),
40
  "Submission Date": pd.to_datetime(df["submission_date"]).dt.strftime("%Y-%m-%d")
41
  })
42
 
@@ -152,7 +152,7 @@ with gr.Blocks(css="""
152
  gr.Markdown("""
153
  ## Explanation of Metrics
154
  - **PER (Phoneme Error Rate)**: The Levenshtein distance calculated between phoneme sequences of the predicted and actual transcriptions.
155
- - **PWED (Phoneme Weighted Edit Distance)**: A measure of the edit distance between the predicted and actual phoneme sequences, weighted by the phonemic feature distance. Feature vectors provided by panphon library
156
  """)
157
  gr.Markdown("""
158
  ## Test Set Information
 
36
  "Model": df["model"],
37
  "Average PER ⬇️": df["average_per"].apply(lambda x: f"{x:.4f}"),
38
  "Average PWED ⬇️": df["average_pwed"].apply(lambda x: f"{x:.4f}"),
39
+ "Link": df["github_url"].apply(lambda x: f'<a href="{x}" target="_blank">Repository</a>' if x else "N/A"),
40
  "Submission Date": pd.to_datetime(df["submission_date"]).dt.strftime("%Y-%m-%d")
41
  })
42
 
 
152
  gr.Markdown("""
153
  ## Explanation of Metrics
154
  - **PER (Phoneme Error Rate)**: The Levenshtein distance calculated between phoneme sequences of the predicted and actual transcriptions.
155
+ - **PWED (Phoneme Weighted Edit Distance)**: Edit distance between the predicted and actual phoneme sequences, weighted by the phonemic feature distance. Method provided by [panphon library](https://github.com/dmort27/panphon)
156
  """)
157
  gr.Markdown("""
158
  ## Test Set Information
queue/leaderboard.json CHANGED
@@ -178,5 +178,15 @@
178
  "subset": "test",
179
  "github_url": "https://huggingface.co/speech31/wav2vec2-large-TIMIT-IPA2",
180
  "submission_date": "2024-12-20T22:50:50.645178"
 
 
 
 
 
 
 
 
 
 
181
  }
182
  ]
 
178
  "subset": "test",
179
  "github_url": "https://huggingface.co/speech31/wav2vec2-large-TIMIT-IPA2",
180
  "submission_date": "2024-12-20T22:50:50.645178"
181
+ },
182
+ {
183
+ "submission_id": "4126d265-418f-4d11-8a29-4e69f064f1dd",
184
+ "submission_name": "ginic model, facebook/wav2vec2-large-xlsr-53 fine tuned",
185
+ "model": "ginic/vary_individuals_young_only_3_wav2vec2-large-xlsr-buckeye-ipa",
186
+ "average_per": 0.2807914104790719,
187
+ "average_pwed": 0.10494355278037441,
188
+ "subset": "test",
189
+ "github_url": "https://huggingface.co/ginic/vary_individuals_young_only_3_wav2vec2-large-xlsr-buckeye-ipa",
190
+ "submission_date": "2024-12-21T01:31:04.862397"
191
  }
192
  ]
queue/results.json CHANGED
@@ -964,5 +964,51 @@
964
  }
965
  ],
966
  "timestamp": "2024-12-20T22:50:50.641790"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
967
  }
968
  ]
 
964
  }
965
  ],
966
  "timestamp": "2024-12-20T22:50:50.641790"
967
+ },
968
+ {
969
+ "task_id": "81fa94f8-94ae-4601-952c-24abaddaf691",
970
+ "model": "ginic/vary_individuals_young_only_3_wav2vec2-large-xlsr-buckeye-ipa",
971
+ "subset": "test",
972
+ "num_files": 1680,
973
+ "average_per": 0.2807914104790719,
974
+ "average_pwed": 0.10494355278037441,
975
+ "detailed_results": [
976
+ {
977
+ "file": "data/TEST/DR1/FAKS0/SA1.WAV",
978
+ "ground_truth": "ʃihædjɹdɑɹksuɾɪŋgɹisiwɑʃwɑɾɹʔɔljiɹ",
979
+ "prediction": "ʃihædjɹdɑɹksuɾɪnɡɹisiwɔʃwɔɾɹ̩ɔljiɹ",
980
+ "per": 0.18181818181818182,
981
+ "pwed": 0.0744949494949495
982
+ },
983
+ {
984
+ "file": "data/TEST/DR1/FAKS0/SA2.WAV",
985
+ "ground_truth": "oʊnæsmitikɛɹiinɔɪliɹæglaɪkðæt",
986
+ "prediction": "doʊndæskmidɪkæɹiɪnɔɪliɹæɡlaɪkðæʔ",
987
+ "per": 0.32142857142857145,
988
+ "pwed": 0.140625
989
+ },
990
+ {
991
+ "file": "data/TEST/DR1/FAKS0/SI1573.WAV",
992
+ "ground_truth": "hɪzkæpinwəsθɪnænhægɹdinɪzbjuɾuflbutswɹwɔɹninʃæbi",
993
+ "prediction": "hɪzkæptʌnwʌzθɪnɛnhæɡɹ̩dɛnɪzbjuɾʌfl̩butswɹ̩wɔɹnɪnʃæbi",
994
+ "per": 0.2553191489361702,
995
+ "pwed": 0.05357142857142856
996
+ },
997
+ {
998
+ "file": "data/TEST/DR1/FAKS0/SI2203.WAV",
999
+ "ground_truth": "ðiɹizənzfɹðɪsdaɪvsimdfuliʃnaʊ",
1000
+ "prediction": "ðʌɹizʌn̩zfɹðʌstaɪvsimtfulɪʃnaʊ",
1001
+ "per": 0.2413793103448276,
1002
+ "pwed": 0.014367816091954023
1003
+ },
1004
+ {
1005
+ "file": "data/TEST/DR1/FAKS0/SI943.WAV",
1006
+ "ground_truth": "ɹdʌkʃinmeɪfɔlfɑɹbəloʊəkspikeɪʃnts",
1007
+ "prediction": "pɹʌdʌkʃn̩meɪfɔlfɑɹbʌloʊɛkspɛkteɪʃʌns",
1008
+ "per": 0.30303030303030304,
1009
+ "pwed": 0.12023809523809523
1010
+ }
1011
+ ],
1012
+ "timestamp": "2024-12-21T01:31:04.859070"
1013
  }
1014
  ]
queue/tasks.json CHANGED
@@ -251,7 +251,7 @@
251
  "subset": "test",
252
  "submission_name": "ginic model, facebook/wav2vec2-large-xlsr-53 fine tuned",
253
  "github_url": "https://huggingface.co/ginic/vary_individuals_young_only_3_wav2vec2-large-xlsr-buckeye-ipa",
254
- "status": "processing",
255
  "submitted_at": "2024-12-21T01:15:41.870875"
256
  }
257
  ]
 
251
  "subset": "test",
252
  "submission_name": "ginic model, facebook/wav2vec2-large-xlsr-53 fine tuned",
253
  "github_url": "https://huggingface.co/ginic/vary_individuals_young_only_3_wav2vec2-large-xlsr-buckeye-ipa",
254
+ "status": "completed",
255
  "submitted_at": "2024-12-21T01:15:41.870875"
256
  }
257
  ]