jssky commited on
Commit
407024f
·
verified ·
1 Parent(s): a5d2e6e

Training in progress, step 10, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1623d6b3a59c7a32c66f828a169ca71f7b735b77b2c6a27858726a06327cfc22
3
  size 130583912
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d757243f503344b7811431b04ed26faa173948ed9e56ea963ca55e8e7e4bc03b
3
  size 130583912
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cf789c0a027087f7c384511e444dce2b20eb558b0d64f3b76f6360736ca67bb3
3
  size 66578772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0cfc89fc11ed4c15cb339f27a6743d01d0200f8327c89f05ae72c424ab687e25
3
  size 66578772
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8d63289c5d04f2383b71ba99ab7652862b29466628d679a7f2b02d0fcdcc4da0
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8bf6413e852be2cf688208c1704f913e5832da44d4c80b17ec9583f98fb0864c
3
  size 15984
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:93154ab653dd9adc62e305cb44be3d4cf8f6f7370124d22ce262388fdd3f16b5
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1e4e1e3668e91b54a58da1ce6f5c7e6b1553629081e2ee6e6ec89e9df4de7128
3
  size 15984
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:edad8284ff84b94ec708b9eb257b9d770d3adef066494f245cf2c51dc659164b
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dabebd1c16ad1482a9b6ac36cbcd94d2fb8623833ce700c649442aab5592f63c
3
  size 15984
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f9c8dbb46a9a74fc09c0eb4d787c118be17c860af785749c012382f79fbc9121
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:422a5e7e7660c4a9fddfbb53556696d7909d580ade84163abb00a59311819365
3
  size 15984
last-checkpoint/rng_state_4.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:009402242046e588b30763e69f21be1c7fde9c10c17467c4a20db57ff0c78e87
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb732cb1b72b02838d9caad609515135e7638548c69ee64a18f63b8eef2b048f
3
  size 15984
last-checkpoint/rng_state_5.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1ba0c0bd9979cfe74fa236eb5a2e4c12f3ea24dd8cbe5225eb3f303941c44c3c
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb63466a5bcf657473f2d960e277d4cbcc0a9c4a1e451be5d373a79f8fc4196f
3
  size 15984
last-checkpoint/rng_state_6.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:33bf9a4ef7c0b20ceeaa1cbd1bacae415bdb21876893a2072dc934f8a9da7b5d
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:61e5883f037f93f02b6a025b5cb7d945d09d8e29f914292c468c9e4e008a85ce
3
  size 15984
last-checkpoint/rng_state_7.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:75a57d3dbd028d4822c84de2623c8b1fedf5f921d0a089d23fb7b9b24235a874
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f387686327168eef8043d717153998c55445f4ab3f6ae746687ee9f06afb96ec
3
  size 15984
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8bdda546a1390be3b85a90dd4ef31050dfb7b691765ffc12ed691b6786ed6e3d
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:26a93b2a1f4b5368650119fe6e0d6eec6d19cda6badeba4d21943ab48964fa00
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.18,
5
  "eval_steps": 3,
6
- "global_step": 9,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -102,6 +102,13 @@
102
  "eval_samples_per_second": 28.601,
103
  "eval_steps_per_second": 3.745,
104
  "step": 9
 
 
 
 
 
 
 
105
  }
106
  ],
107
  "logging_steps": 1,
@@ -116,12 +123,12 @@
116
  "should_evaluate": false,
117
  "should_log": false,
118
  "should_save": true,
119
- "should_training_stop": false
120
  },
121
  "attributes": {}
122
  }
123
  },
124
- "total_flos": 4.713086603545805e+16,
125
  "train_batch_size": 1,
126
  "trial_name": null,
127
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.2,
5
  "eval_steps": 3,
6
+ "global_step": 10,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
102
  "eval_samples_per_second": 28.601,
103
  "eval_steps_per_second": 3.745,
104
  "step": 9
105
+ },
106
+ {
107
+ "epoch": 0.2,
108
+ "grad_norm": 48.75463104248047,
109
+ "learning_rate": 0.00016,
110
+ "loss": 8.6251,
111
+ "step": 10
112
  }
113
  ],
114
  "logging_steps": 1,
 
123
  "should_evaluate": false,
124
  "should_log": false,
125
  "should_save": true,
126
+ "should_training_stop": true
127
  },
128
  "attributes": {}
129
  }
130
  },
131
+ "total_flos": 5.236762892828672e+16,
132
  "train_batch_size": 1,
133
  "trial_name": null,
134
  "trial_params": null