IPA-Transcription-EN

Sleeping

App Files Community

arunasrivastava committed on Dec 19, 2024

Commit

03346c0

1 Parent(s): 7d25ccc

updating descriptions

Browse files

Files changed (6) hide show

__pycache__/main.cpython-310.pyc +0 -0
app.py +6 -5
main.py +1 -1
queue/leaderboard.json +30 -0
queue/results.json +138 -0
queue/tasks.json +36 -0

__pycache__/main.cpython-310.pyc CHANGED Viewed

Binary files a/__pycache__/main.cpython-310.pyc and b/__pycache__/main.cpython-310.pyc differ

app.py CHANGED Viewed

@@ -135,7 +135,7 @@ with gr.Blocks(css="""
         box-shadow: 0 0 20px rgba(0, 0, 0, 0.15);
     }
     .styled-table thead tr {
-        background-color: #96b9D0;
         color: #ffffff;
         text-align: left;
     }
@@ -157,22 +157,23 @@ with gr.Blocks(css="""
     ## Test Set Information
     The test set used for evaluation is from the [TIMIT speech corpus](https://www.kaggle.com/datasets/mfekadu/darpa-timit-acousticphonetic-continuous-speech). The TIMIT corpus is a widely used dataset for speech recognition research.
-    ## Processing Time
-    Please note that processing will take around 2 minutes.
     """)
     with gr.Tabs():
         with gr.TabItem("🏆 Leaderboard"):
             leaderboard_html = gr.HTML(create_html_table(format_leaderboard_df(load_leaderboard_data())))
             refresh_btn = gr.Button("🔄 Refresh")
             refresh_btn.click(
-                lambda: gr.HTML.update(value=create_html_table(format_leaderboard_df(load_leaderboard_data()))),
                 outputs=leaderboard_html
             )
         with gr.TabItem("📝 Submit Model"):
             model_name = gr.Textbox(label="Model Name", placeholder="facebook/wav2vec2-lv-60-espeak-cv-ft")
             submission_name = gr.Textbox(label="Submission Name", placeholder="My Model v1.0")
-            github_url = gr.Textbox(label="GitHub URL (optional)", placeholder="https://github.com/username/repo")
             submit_btn = gr.Button("Submit")
             result = gr.Textbox(label="Submission Status")

         box-shadow: 0 0 20px rgba(0, 0, 0, 0.15);
     }
     .styled-table thead tr {
+        background-color: #004999;
         color: #ffffff;
         text-align: left;
     }
     ## Test Set Information
     The test set used for evaluation is from the [TIMIT speech corpus](https://www.kaggle.com/datasets/mfekadu/darpa-timit-acousticphonetic-continuous-speech). The TIMIT corpus is a widely used dataset for speech recognition research.
+    ## Compute
+    This leaderboard uses the free basic plan (16GB RAM, 2vCPUs). The evaluation may take several hours to complete. Please be patient and do not submit the same model multiple times.
     """)
     with gr.Tabs():
         with gr.TabItem("🏆 Leaderboard"):
             leaderboard_html = gr.HTML(create_html_table(format_leaderboard_df(load_leaderboard_data())))
             refresh_btn = gr.Button("🔄 Refresh")
             refresh_btn.click(
+                lambda: create_html_table(format_leaderboard_df(load_leaderboard_data())),
                 outputs=leaderboard_html
             )
         with gr.TabItem("📝 Submit Model"):
             model_name = gr.Textbox(label="Model Name", placeholder="facebook/wav2vec2-lv-60-espeak-cv-ft")
             submission_name = gr.Textbox(label="Submission Name", placeholder="My Model v1.0")
+            github_url = gr.Textbox(label="Github/Kaggle/HF URL (optional)", placeholder="https://github.com/username/repo")
             submit_btn = gr.Button("Submit")
             result = gr.Textbox(label="Submission Status")

main.py CHANGED Viewed

@@ -488,7 +488,7 @@ async def get_leaderboard():
     """Get current leaderboard"""
     try:
         leaderboard = storage_manager.load('leaderboard')
-        sorted_leaderboard = sorted(leaderboard, key=lambda x: (x["average_per"], x["average_pwed"]))
         return sorted_leaderboard
     except Exception as e:
         print(f"Error loading leaderboard: {e}")

     """Get current leaderboard"""
     try:
         leaderboard = storage_manager.load('leaderboard')
+        sorted_leaderboard = sorted(leaderboard, key=lambda x: (x["average_pwed"], x["average_per"]))
         return sorted_leaderboard
     except Exception as e:
         print(f"Error loading leaderboard: {e}")

queue/leaderboard.json CHANGED Viewed

@@ -68,5 +68,35 @@
         "subset": "test",
         "github_url": "https://github.com/KoelLabs/ML/",
         "submission_date": "2024-12-12T16:07:25.391145"
     }
 ]

         "subset": "test",
         "github_url": "https://github.com/KoelLabs/ML/",
         "submission_date": "2024-12-12T16:07:25.391145"
+    },
+    {
+        "submission_id": "02f223d4-7b98-4613-9377-19b74defe308",
+        "submission_name": "wav2vec2 ipa eng ",
+        "model": "snu-nia-12/wav2vec2-large_nia12_phone-ipa_english",
+        "average_per": 0.4847029843149011,
+        "average_pwed": 0.2072006544586948,
+        "subset": "test",
+        "github_url": null,
+        "submission_date": "2024-12-18T22:01:20.855881"
+    },
+    {
+        "submission_id": "bed08468-42c7-459f-a46d-49ead50abfbc",
+        "submission_name": "fine-tuned version of facebook/wav2vec2-xls-r-300m on the Timit dataset",
+        "model": "vitouphy/wav2vec2-xls-r-300m-timit-phoneme",
+        "average_per": 0.2561961414705681,
+        "average_pwed": 0.1378394393452702,
+        "subset": "test",
+        "github_url": "https://www.kaggle.com/code/vitouphy/phoneme-recognition-with-wav2vec2",
+        "submission_date": "2024-12-18T22:50:59.627338"
+    },
+    {
+        "submission_id": "4086072e-9368-442f-97cd-1fda6bf6656e",
+        "submission_name": "wav2vec2 model",
+        "model": "ctaguchi/wav2vec2-large-xlsr-japlmthufielta-ipa-plus-2000",
+        "average_per": 0.6479484324708775,
+        "average_pwed": 0.18710002665151734,
+        "subset": "test",
+        "github_url": "https://huggingface.co/ctaguchi/wav2vec2-large-xlsr-japlmthufielta-ipa1000-ns",
+        "submission_date": "2024-12-18T23:29:27.322286"
     }
 ]

queue/results.json CHANGED Viewed

@@ -366,5 +366,143 @@
             }
         ],
         "timestamp": "2024-12-12T16:07:25.389475"
     }
 ]

             }
         ],
         "timestamp": "2024-12-12T16:07:25.389475"
+    },
+    {
+        "task_id": "2e592612-ca38-4afb-a6a0-3c870b288960",
+        "model": "snu-nia-12/wav2vec2-large_nia12_phone-ipa_english",
+        "subset": "test",
+        "num_files": 1680,
+        "average_per": 0.4847029843149011,
+        "average_pwed": 0.2072006544586948,
+        "detailed_results": [
+            {
+                "file": "data/TEST/DR1/FAKS0/SA1.WAV",
+                "ground_truth": "ʃihædjɹdɑɹksuɾɪŋgɹisiwɑʃwɑɾɹʔɔljiɹ",
+                "prediction": "ʃihædjʊrdɑrksutɪngrisiwɑʃwɔtərɔljɪrər",
+                "per": 0.42424242424242425,
+                "pwed": 0.15393518518518517
+            },
+            {
+                "file": "data/TEST/DR1/FAKS0/SA2.WAV",
+                "ground_truth": "oʊnæsmitikɛɹiinɔɪliɹæglaɪkðæt",
+                "prediction": "doʊntæskmitɪkɛriənɔɪliræglaɪkðətdoʊndt",
+                "per": 0.5,
+                "pwed": 0.2623873873873874
+            },
+            {
+                "file": "data/TEST/DR1/FAKS0/SI1573.WAV",
+                "ground_truth": "hɪzkæpinwəsθɪnænhægɹdinɪzbjuɾuflbutswɹwɔɹninʃæbi",
+                "prediction": "hɪzkæptənwɑzθɪnəndhægərdəndhɪzbjutəfəlbutswərwɔrnəndʃæbiiii",
+                "per": 0.46808510638297873,
+                "pwed": 0.2191091954022989
+            },
+            {
+                "file": "data/TEST/DR1/FAKS0/SI2203.WAV",
+                "ground_truth": "ðiɹizənzfɹðɪsdaɪvsimdfuliʃnaʊ",
+                "prediction": "ðərizənzfərðɪstaɪvsimdfulɪʃnaʊ",
+                "per": 0.20689655172413793,
+                "pwed": 0.054166666666666675
+            },
+            {
+                "file": "data/TEST/DR1/FAKS0/SI943.WAV",
+                "ground_truth": "ɹdʌkʃinmeɪfɔlfɑɹbəloʊəkspikeɪʃnts",
+                "prediction": "prədəkʃənmeɪfɔlfɑrbɪloʊɛkspɛkteɪʃənzpzppppzpdtdtd",
+                "per": 0.7272727272727273,
+                "pwed": 0.34438775510204084
+            }
+        ],
+        "timestamp": "2024-12-18T22:01:20.853274"
+    },
+    {
+        "task_id": "d38e65ce-75b5-4dbf-8ade-bff6a5803790",
+        "model": "vitouphy/wav2vec2-xls-r-300m-timit-phoneme",
+        "subset": "test",
+        "num_files": 1680,
+        "average_per": 0.2561961414705681,
+        "average_pwed": 0.1378394393452702,
+        "detailed_results": [
+            {
+                "file": "data/TEST/DR1/FAKS0/SA1.WAV",
+                "ground_truth": "ʃihædjɹdɑɹksuɾɪŋgɹisiwɑʃwɑɾɹʔɔljiɹ",
+                "prediction": "ʃihædjɝdɑɹksuɾɪngɹisiwɑʃwɑɾɝɑljiɝ",
+                "per": 0.18181818181818182,
+                "pwed": 0.13257575757575757
+            },
+            {
+                "file": "data/TEST/DR1/FAKS0/SA2.WAV",
+                "ground_truth": "oʊnæsmitikɛɹiinɔɪliɹæglaɪkðæt",
+                "prediction": "doʊnæskmitɪkæɹiɪnɔɪliɹæglaɪkðæ",
+                "per": 0.21428571428571427,
+                "pwed": 0.10919540229885057
+            },
+            {
+                "file": "data/TEST/DR1/FAKS0/SI1573.WAV",
+                "ground_truth": "hɪzkæpinwəsθɪnænhægɹdinɪzbjuɾuflbutswɹwɔɹninʃæbi",
+                "prediction": "hɪzkætɪnwəsθɪnənhægɝdɪnɪzbjuɾɪflbutswɝwɑɹnɪnʃæbi",
+                "per": 0.19148936170212766,
+                "pwed": 0.0576241134751773
+            },
+            {
+                "file": "data/TEST/DR1/FAKS0/SI2203.WAV",
+                "ground_truth": "ðiɹizənzfɹðɪsdaɪvsimdfuliʃnaʊ",
+                "prediction": "ðɪɹizənzfɝðɪsdaɪvsimdfulɪʃnaʊ",
+                "per": 0.10344827586206896,
+                "pwed": 0.03735632183908046
+            },
+            {
+                "file": "data/TEST/DR1/FAKS0/SI943.WAV",
+                "ground_truth": "ɹdʌkʃinmeɪfɔlfɑɹbəloʊəkspikeɪʃnts",
+                "prediction": "pɹɝdəkʃɪnmeɪfɑlfɹbloʊɛkspɛteɪʃɪns",
+                "per": 0.3333333333333333,
+                "pwed": 0.12373737373737376
+            }
+        ],
+        "timestamp": "2024-12-18T22:50:59.625872"
+    },
+    {
+        "task_id": "2839c0c6-8f3b-426e-9eb7-04b6e133dc47",
+        "model": "ctaguchi/wav2vec2-large-xlsr-japlmthufielta-ipa-plus-2000",
+        "subset": "test",
+        "num_files": 1680,
+        "average_per": 0.6479484324708775,
+        "average_pwed": 0.18710002665151734,
+        "detailed_results": [
+            {
+                "file": "data/TEST/DR1/FAKS0/SA1.WAV",
+                "ground_truth": "ʃihædjɹdɑɹksuɾɪŋgɹisiwɑʃwɑɾɹʔɔljiɹ",
+                "prediction": "ʂixadjodarksyːdɨnɡwisiwaːʃwarɒɔjiːr",
+                "per": 0.6060606060606061,
+                "pwed": 0.15404040404040406
+            },
+            {
+                "file": "data/TEST/DR1/FAKS0/SA2.WAV",
+                "ground_truth": "oʊnæsmitikɛɹiinɔɪliɹæglaɪkðæt",
+                "prediction": "dondaːskmiːdɨkɛːɻjɒnojluiʋɻaːɡlɑjɡtaːn",
+                "per": 0.8928571428571429,
+                "pwed": 0.2146464646464646
+            },
+            {
+                "file": "data/TEST/DR1/FAKS0/SI1573.WAV",
+                "ground_truth": "hɪzkæpinwəsθɪnænhægɹdinɪzbjuɾuflbutswɹwɔɹninʃæbi",
+                "prediction": "hizkaːptanustinanhagɛɻdɛnizbiurufubutswuɾʋoːɻninʂaːbi",
+                "per": 0.5106382978723404,
+                "pwed": 0.1096938775510204
+            },
+            {
+                "file": "data/TEST/DR1/FAKS0/SI2203.WAV",
+                "ground_truth": "ðiɹizənzfɹðɪsdaɪvsimdfuliʃnaʊ",
+                "prediction": "ðrisɔnsfrdɔsdaːjvsimtfulɛʂnɛ",
+                "per": 0.5172413793103449,
+                "pwed": 0.11063218390804598
+            },
+            {
+                "file": "data/TEST/DR1/FAKS0/SI943.WAV",
+                "ground_truth": "ɹdʌkʃinmeɪfɔlfɑɹbəloʊəkspikeɪʃnts",
+                "prediction": "pɛdakɕɔnmɛjfaɔfarbuwɔwɛkspɛktajʂɔnt͡s",
+                "per": 0.7272727272727273,
+                "pwed": 0.15
+            }
+        ],
+        "timestamp": "2024-12-18T23:29:27.320433"
     }
 ]

queue/tasks.json CHANGED Viewed

@@ -88,5 +88,41 @@
         "github_url": "https://github.com/KoelLabs/ML/",
         "status": "completed",
         "submitted_at": "2024-12-12T15:53:07.620070"
     }
 ]

         "github_url": "https://github.com/KoelLabs/ML/",
         "status": "completed",
         "submitted_at": "2024-12-12T15:53:07.620070"
+    },
+    {
+        "id": "2e592612-ca38-4afb-a6a0-3c870b288960",
+        "model": "snu-nia-12/wav2vec2-large_nia12_phone-ipa_english",
+        "subset": "test",
+        "submission_name": "wav2vec2 ipa eng ",
+        "github_url": "",
+        "status": "completed",
+        "submitted_at": "2024-12-18T21:41:21.861322"
+    },
+    {
+        "id": "ac4cbe86-4dbe-4929-8f76-4d2052e0acf1",
+        "model": "vitouphy/wav2vec2-xls-r-300m-timit-phoneme",
+        "subset": "test",
+        "submission_name": "fine-tuned version of facebook/wav2vec2-xls-r-300m on the Timit dataset",
+        "github_url": "https://www.kaggle.com/code/vitouphy/phoneme-recognition-with-wav2vec2",
+        "status": "processing",
+        "submitted_at": "2024-12-18T22:09:03.412372"
+    },
+    {
+        "id": "d38e65ce-75b5-4dbf-8ade-bff6a5803790",
+        "model": "vitouphy/wav2vec2-xls-r-300m-timit-phoneme",
+        "subset": "test",
+        "submission_name": "fine-tuned version of facebook/wav2vec2-xls-r-300m on the Timit dataset",
+        "github_url": "https://www.kaggle.com/code/vitouphy/phoneme-recognition-with-wav2vec2",
+        "status": "completed",
+        "submitted_at": "2024-12-18T22:19:46.817373"
+    },
+    {
+        "id": "2839c0c6-8f3b-426e-9eb7-04b6e133dc47",
+        "model": "ctaguchi/wav2vec2-large-xlsr-japlmthufielta-ipa-plus-2000",
+        "subset": "test",
+        "submission_name": "wav2vec2 model",
+        "github_url": "https://huggingface.co/ctaguchi/wav2vec2-large-xlsr-japlmthufielta-ipa1000-ns",
+        "status": "completed",
+        "submitted_at": "2024-12-18T22:55:36.734691"
     }
 ]