jun-han committed on
Commit
7f42f6d
·
verified ·
1 Parent(s): bc77b7f

Training checkpoint

Browse files
Files changed (2) hide show
  1. README.md +8 -6
  2. trainer_state.json +44 -12
README.md CHANGED
@@ -1,22 +1,24 @@
1
  ---
2
- base_model: openai/whisper-small
3
  library_name: transformers
 
 
4
  license: apache-2.0
5
- metrics:
6
- - wer
7
  tags:
8
  - generated_from_trainer
 
 
9
  model-index:
10
- - name: Whisper-squeezeformer-v3
11
  results: []
12
  ---
13
 
14
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
15
  should probably proofread and complete it, then remove this comment. -->
16
 
17
- # Whisper-squeezeformer-v3
18
 
19
- This model is a fine-tuned version of [openai/whisper-small](https://huggingface.co/openai/whisper-small) on the None dataset.
20
  It achieves the following results on the evaluation set:
21
  - Loss: 0.1322
22
  - Wer: 5.6642
 
1
  ---
 
2
  library_name: transformers
3
+ language:
4
+ - en
5
  license: apache-2.0
6
+ base_model: openai/whisper-small
 
7
  tags:
8
  - generated_from_trainer
9
+ metrics:
10
+ - wer
11
  model-index:
12
+ - name: Whisper-squeezeformer-NSQU-whisper
13
  results: []
14
  ---
15
 
16
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
17
  should probably proofread and complete it, then remove this comment. -->
18
 
19
+ # Whisper-squeezeformer-NSQU-whisper
20
 
21
+ This model is a fine-tuned version of [openai/whisper-small](https://huggingface.co/openai/whisper-small) on the LibriSpeech dataset.
22
  It achieves the following results on the evaluation set:
23
  - Loss: 0.1322
24
  - Wer: 5.6642
trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 5.599513085818624,
3
  "best_model_checkpoint": "./Whisper-squeezeformer-v3\\checkpoint-40000",
4
- "epoch": 18.0,
5
  "eval_steps": 2500,
6
- "global_step": 45000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -297,19 +297,51 @@
297
  "step": 45000
298
  },
299
  {
300
- "epoch": 18.0,
301
- "step": 45000,
302
- "total_flos": 3.11981580288e+20,
303
- "train_loss": 0.024614295111762153,
304
- "train_runtime": 36051.4679,
305
- "train_samples_per_second": 24.964,
306
- "train_steps_per_second": 1.248
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
307
  }
308
  ],
309
  "logging_steps": 2500,
310
- "max_steps": 45000,
311
  "num_input_tokens_seen": 0,
312
- "num_train_epochs": 18,
313
  "save_steps": 2500,
314
  "stateful_callbacks": {
315
  "TrainerControl": {
@@ -323,7 +355,7 @@
323
  "attributes": {}
324
  }
325
  },
326
- "total_flos": 3.11981580288e+20,
327
  "train_batch_size": 20,
328
  "trial_name": null,
329
  "trial_params": null
 
1
  {
2
  "best_metric": 5.599513085818624,
3
  "best_model_checkpoint": "./Whisper-squeezeformer-v3\\checkpoint-40000",
4
+ "epoch": 20.0,
5
  "eval_steps": 2500,
6
+ "global_step": 50000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
297
  "step": 45000
298
  },
299
  {
300
+ "epoch": 19.0,
301
+ "grad_norm": 4.747838973999023,
302
+ "learning_rate": 5.309473684210527e-07,
303
+ "loss": 0.3373,
304
+ "step": 47500
305
+ },
306
+ {
307
+ "epoch": 19.0,
308
+ "eval_loss": 0.13534972071647644,
309
+ "eval_runtime": 649.9396,
310
+ "eval_samples_per_second": 4.031,
311
+ "eval_steps_per_second": 0.505,
312
+ "eval_wer": 5.740261716372489,
313
+ "step": 47500
314
+ },
315
+ {
316
+ "epoch": 20.0,
317
+ "grad_norm": 5.997547626495361,
318
+ "learning_rate": 4.842105263157895e-09,
319
+ "loss": 0.2785,
320
+ "step": 50000
321
+ },
322
+ {
323
+ "epoch": 20.0,
324
+ "eval_loss": 0.13221722841262817,
325
+ "eval_runtime": 634.989,
326
+ "eval_samples_per_second": 4.126,
327
+ "eval_steps_per_second": 0.517,
328
+ "eval_wer": 5.6641813755325625,
329
+ "step": 50000
330
+ },
331
+ {
332
+ "epoch": 20.0,
333
+ "step": 50000,
334
+ "total_flos": 3.4664620032e+20,
335
+ "train_loss": 0.030787386474609376,
336
+ "train_runtime": 24493.4093,
337
+ "train_samples_per_second": 40.827,
338
+ "train_steps_per_second": 2.041
339
  }
340
  ],
341
  "logging_steps": 2500,
342
+ "max_steps": 50000,
343
  "num_input_tokens_seen": 0,
344
+ "num_train_epochs": 20,
345
  "save_steps": 2500,
346
  "stateful_callbacks": {
347
  "TrainerControl": {
 
355
  "attributes": {}
356
  }
357
  },
358
+ "total_flos": 3.4664620032e+20,
359
  "train_batch_size": 20,
360
  "trial_name": null,
361
  "trial_params": null