jasmeeetsingh committed on
Commit
1fb5c0e
·
1 Parent(s): ed12e1e

Training in progress, step 6000, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:43404aa4801c8a8f07d44770fc0ae19c928ca84485064b608bdf6cb0e8d9347a
3
  size 2384440
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:85b422ee3958e189a80805f9f965a72c206d8049b9f09de490eb890e2ce1a613
3
  size 2384440
last-checkpoint/global_step6000/zero_pp_rank_0_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:215d9ebee4db7ada43a179c37480a4bb6ffbea5b9f9ce3b025332cd422ca8aed
3
+ size 3621285613
last-checkpoint/global_step6000/zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f9117bd105c2a585b2a71bbe1fcda5b458785ca444cd771b854037d5c59462f2
3
+ size 3542398
last-checkpoint/global_step6000/zero_pp_rank_1_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:34be61ca15897765094e0bff9d07430873d7c70d342a48934b5c437669d8c841
3
+ size 3621285613
last-checkpoint/global_step6000/zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84aadcdf820229bbb8699d3323272ce296cd085e451274879eed9f343aaa89fb
3
+ size 3542398
last-checkpoint/global_step6000/zero_pp_rank_2_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e4d0a486549934eb96c39e9240b40dc232e759778eb47182c4b6c7410a98d3b5
3
+ size 3621285613
last-checkpoint/global_step6000/zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:49307bef2bd400cf814aa71b5ea9ae7c5f457dae70a4151a7ba191ad05beb921
3
+ size 3542398
last-checkpoint/global_step6000/zero_pp_rank_3_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9bb775385db2832cb91fd59cf72dbd16be582202bd50ed16f73a84a5e10358a2
3
+ size 3621285613
last-checkpoint/global_step6000/zero_pp_rank_3_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6e25d262deca190648b50b5dc7b37900e05fac39325115fc6ecf745071c968f0
3
+ size 3542398
last-checkpoint/latest CHANGED
@@ -1 +1 @@
1
- global_step5000
 
1
+ global_step6000
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bbc46a1b44d90304fa6c2d97e45a09ff9ca39e2f158513357c6cbafadd965846
3
  size 17655
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d32349f4b48b9fb4729a79147fd7b83d66f0d4c2474b9f1e25ff4d1f056ed81b
3
  size 17655
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:12bd87b02d242431882456ba54feb929c619932428f827859ffa31f8595a6685
3
  size 17655
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c3b1142fca547114f3d0a445f9800567d556596ee89ff6a986d92b5245f0dd93
3
  size 17655
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:60503c24da7903188168982879429796e990d5059867cd1ae5b5ed86b0aa3966
3
  size 17655
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93cde37cb441ecff6612fae913672d7d9b71d9755e386684e5be26f202a20f4d
3
  size 17655
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5fc535ca2f5c6f4069ade15a885ef339906847e85c537ee37acb74a1c28d19da
3
  size 17655
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d5a1d857da05e0f9f6ddfb61aacc0dff2f758b31c8fb47768b2dafe568cfc92d
3
  size 17655
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 3.9093041438623923,
5
  "eval_steps": 500,
6
- "global_step": 5000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -37,13 +37,19 @@
37
  "learning_rate": 0.0001,
38
  "loss": 0.4379,
39
  "step": 5000
 
 
 
 
 
 
40
  }
41
  ],
42
  "logging_steps": 1000,
43
  "max_steps": 12790,
44
  "num_train_epochs": 10,
45
  "save_steps": 1000,
46
- "total_flos": 36500817838080.0,
47
  "trial_name": null,
48
  "trial_params": null
49
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 4.691164972634871,
5
  "eval_steps": 500,
6
+ "global_step": 6000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
37
  "learning_rate": 0.0001,
38
  "loss": 0.4379,
39
  "step": 5000
40
+ },
41
+ {
42
+ "epoch": 4.69,
43
+ "learning_rate": 0.0001,
44
+ "loss": 0.4208,
45
+ "step": 6000
46
  }
47
  ],
48
  "logging_steps": 1000,
49
  "max_steps": 12790,
50
  "num_train_epochs": 10,
51
  "save_steps": 1000,
52
+ "total_flos": 43787607343104.0,
53
  "trial_name": null,
54
  "trial_params": null
55
  }