youdiniplays committed on
Commit
68da59c
·
verified ·
1 Parent(s): 057474c

Training in progress, step 11500, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:70f5fee0b4112dd0db7e86095d48cbf6893b4dfe629a726d3abec8b8e2a1e10e
3
  size 242041896
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:214e311a786637414b3cc77ddd784b3f3a41fb5e3fc116ca8b692dcad6f03aca
3
  size 242041896
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:55cf6ab4ba17f036690d4af65be07e56e29c571fd2cc7031d5670680d7d25984
3
  size 484163514
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b0091a67a2288f1e898b6efef5db7f93d4e8d8e86728f655273466e0a268c494
3
  size 484163514
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ef2206456a634e56b39f3abcefa5202e78b92d2807bd2e21d857de54a68f5836
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2db5a10ae8e077eb948f8a65081b04034858b4b0907d0313398fe4a4657c1c44
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f64d2100afc2fdeadb9c22cbe8a60fda4e0d6fbe329ea52789fdd94b44f49658
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:855b6253cf532e5dd8b357f2552ac3d9f831efc883e202dbd75e2be7a6e1687d
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 1.6881522406384284,
5
  "eval_steps": 500,
6
- "global_step": 11000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -149,13 +149,19 @@
149
  "learning_rate": 0.0006624923265807244,
150
  "loss": 0.5694,
151
  "step": 11000
 
 
 
 
 
 
152
  }
153
  ],
154
  "logging_steps": 500,
155
  "max_steps": 32580,
156
  "num_train_epochs": 5,
157
  "save_steps": 500,
158
- "total_flos": 5832639523061760.0,
159
  "trial_name": null,
160
  "trial_params": null
161
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 1.7648864333947207,
5
  "eval_steps": 500,
6
+ "global_step": 11500,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
149
  "learning_rate": 0.0006624923265807244,
150
  "loss": 0.5694,
151
  "step": 11000
152
+ },
153
+ {
154
+ "epoch": 1.76,
155
+ "learning_rate": 0.0006471454880294659,
156
+ "loss": 0.5716,
157
+ "step": 11500
158
  }
159
  ],
160
  "logging_steps": 500,
161
  "max_steps": 32580,
162
  "num_train_epochs": 5,
163
  "save_steps": 500,
164
+ "total_flos": 6096687148302336.0,
165
  "trial_name": null,
166
  "trial_params": null
167
  }