jssky committed on
Commit
8e0699d
·
verified ·
1 Parent(s): 152e2a2

Training in progress, step 10, checkpoint

Browse files
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f037179e2f72f8052c567935428a2b336875a279f6a258c94c81c6eda52ca9a7
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f2fa24c4825fb5ace55febf56297d1150b3b471c4fc3043c4851bdd99ffc5d89
3
  size 15984
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:095e7bf64776870b00aad21b5d20fedc85a0ea0239296af560cd4be957fbf562
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3549c96bd60bb982e68c0be3129dc3dbe867ae6b87e9dc28044275954eedaa2d
3
  size 15984
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4c7ea82e6f493a6775b5a4cd8618f2ddb43db4405ab77c46f046a09ea763e869
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:892d0cd8183310f54e678688c542970f37dacb6814ec43f56469182baaaac839
3
  size 15984
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d74456313175ad9b8126678aa9443bfe6356fb4c5d663a059450d3f27587e784
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee36c46891b55b11e5b7ce52eedb64259983bfdbe01c3a5cc6e08e4f3dc2f194
3
  size 15984
last-checkpoint/rng_state_4.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:14afc2d953ce2b165f4da7b4bca19afec155ff1d5805a54379b64f4c34bfd6a9
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ef6548f94857c9961033ae9d5ceae860f3593140487086dd5476df0b3b94989
3
  size 15984
last-checkpoint/rng_state_5.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ed57cfed487b9d17510809e80ef03db1018bf9797a8332cd83d8598a8bf8276d
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:abbec5a34841b8316b91c87aa3201a151f3f41f0cc7ca6db01946c3014aed018
3
  size 15984
last-checkpoint/rng_state_6.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f9ca5a0af0b68b10972e265eafc5246b223cb21b68105b011c346e7cb46fee64
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8aef7c8b7b765ec5a013bd6cd56902e24a39aeb73f446b8e23107edd8ca8805
3
  size 15984
last-checkpoint/rng_state_7.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c8061970669cd0d8e3da8a8bb44cab4dd909f46d3ec4e8db91363c4c8a1e4dc2
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cd83becaa5b096db0939dcb563d1b8ddcee21ec864352cec465ce739a1b9381e
3
  size 15984
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.014516129032258065,
5
  "eval_steps": 3,
6
- "global_step": 9,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -102,6 +102,13 @@
102
  "eval_samples_per_second": 43.725,
103
  "eval_steps_per_second": 5.487,
104
  "step": 9
 
 
 
 
 
 
 
105
  }
106
  ],
107
  "logging_steps": 1,
@@ -116,12 +123,12 @@
116
  "should_evaluate": false,
117
  "should_log": false,
118
  "should_save": true,
119
- "should_training_stop": false
120
  },
121
  "attributes": {}
122
  }
123
  },
124
- "total_flos": 2.655951538618368e+16,
125
  "train_batch_size": 1,
126
  "trial_name": null,
127
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.016129032258064516,
5
  "eval_steps": 3,
6
+ "global_step": 10,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
102
  "eval_samples_per_second": 43.725,
103
  "eval_steps_per_second": 5.487,
104
  "step": 9
105
+ },
106
+ {
107
+ "epoch": 0.016129032258064516,
108
+ "grad_norm": NaN,
109
+ "learning_rate": 0.0,
110
+ "loss": 9.5635,
111
+ "step": 10
112
  }
113
  ],
114
  "logging_steps": 1,
 
123
  "should_evaluate": false,
124
  "should_log": false,
125
  "should_save": true,
126
+ "should_training_stop": true
127
  },
128
  "attributes": {}
129
  }
130
  },
131
+ "total_flos": 2.95105726513152e+16,
132
  "train_batch_size": 1,
133
  "trial_name": null,
134
  "trial_params": null