sedrickkeh committed on
Commit
e584818
·
verified ·
1 Parent(s): 1b133ec

Training in progress, epoch 1

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:69bd20aa53ed14fdec51f243fe768baf6b8f5ec012411a3dde70e3705ecccd7c
3
  size 4976698672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:505efb6f4247342454bcf409ff84e8d62592464e04f0e7f71e04b8975e8c0021
3
  size 4976698672
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a0391a72c3ab88957410a749a8a6514e8f88c95552b9bd1738baf1c4cab711ca
3
  size 4999802720
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6e4d64219904c98a5e8e0790a6cd75f4f9c03f2c257afcfccec4b86fa1196d9d
3
  size 4999802720
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:de2c2e9bbcfe19afa81619ac83322d2362d202a0c6bc0b0fd9663422a22ef7b1
3
  size 4915916176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:01f7fc694f2ca43395bb4cd1ecd339dfc9a958132bad3effc18fa2f08a89e006
3
  size 4915916176
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d543bea9d5164be53be106e3f7b9dfe5518f2fe62022a15fb46d8056cc7f21c5
3
  size 1168138808
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:12a580d2f75179cd1ccea61fe872ea6c42199938674f26ec4a958623300ef2dc
3
  size 1168138808
trainer_log.jsonl CHANGED
@@ -2,3 +2,7 @@
2
  {"current_steps": 20, "total_steps": 90, "loss": 1.0722, "lr": 5e-06, "epoch": 0.6557377049180327, "percentage": 22.22, "elapsed_time": "0:19:13", "remaining_time": "1:07:17"}
3
  {"current_steps": 30, "total_steps": 90, "loss": 1.0317, "lr": 5e-06, "epoch": 0.9836065573770492, "percentage": 33.33, "elapsed_time": "0:28:48", "remaining_time": "0:57:36"}
4
  {"current_steps": 30, "total_steps": 90, "eval_loss": 1.0128474235534668, "epoch": 0.9836065573770492, "percentage": 33.33, "elapsed_time": "0:29:42", "remaining_time": "0:59:25"}
 
 
 
 
 
2
  {"current_steps": 20, "total_steps": 90, "loss": 1.0722, "lr": 5e-06, "epoch": 0.6557377049180327, "percentage": 22.22, "elapsed_time": "0:19:13", "remaining_time": "1:07:17"}
3
  {"current_steps": 30, "total_steps": 90, "loss": 1.0317, "lr": 5e-06, "epoch": 0.9836065573770492, "percentage": 33.33, "elapsed_time": "0:28:48", "remaining_time": "0:57:36"}
4
  {"current_steps": 30, "total_steps": 90, "eval_loss": 1.0128474235534668, "epoch": 0.9836065573770492, "percentage": 33.33, "elapsed_time": "0:29:42", "remaining_time": "0:59:25"}
5
+ {"current_steps": 40, "total_steps": 90, "loss": 1.0379, "lr": 5e-06, "epoch": 1.3155737704918034, "percentage": 44.44, "elapsed_time": "0:40:04", "remaining_time": "0:50:05"}
6
+ {"current_steps": 50, "total_steps": 90, "loss": 0.952, "lr": 5e-06, "epoch": 1.6434426229508197, "percentage": 55.56, "elapsed_time": "0:49:42", "remaining_time": "0:39:45"}
7
+ {"current_steps": 60, "total_steps": 90, "loss": 0.942, "lr": 5e-06, "epoch": 1.971311475409836, "percentage": 66.67, "elapsed_time": "0:59:18", "remaining_time": "0:29:39"}
8
+ {"current_steps": 60, "total_steps": 90, "eval_loss": 0.966790497303009, "epoch": 1.971311475409836, "percentage": 66.67, "elapsed_time": "1:00:31", "remaining_time": "0:30:15"}