Upload folder using huggingface_hub
Browse files- adapter_config.json +2 -2
- adapter_model.safetensors +1 -1
- checkpoint-10/adapter_config.json +2 -2
- checkpoint-10/adapter_model.safetensors +1 -1
- checkpoint-10/optimizer.pt +1 -1
- checkpoint-10/trainer_state.json +2 -2
- checkpoint-10/training_args.bin +1 -1
- checkpoint-20/adapter_config.json +2 -2
- checkpoint-20/adapter_model.safetensors +1 -1
- checkpoint-20/optimizer.pt +1 -1
- checkpoint-20/trainer_state.json +4 -4
- checkpoint-20/training_args.bin +1 -1
- checkpoint-30/adapter_config.json +2 -2
- checkpoint-30/adapter_model.safetensors +1 -1
- checkpoint-30/optimizer.pt +1 -1
- checkpoint-30/trainer_state.json +6 -6
- checkpoint-30/training_args.bin +1 -1
- checkpoint-40/adapter_config.json +2 -2
- checkpoint-40/adapter_model.safetensors +1 -1
- checkpoint-40/optimizer.pt +1 -1
- checkpoint-40/trainer_state.json +8 -8
- checkpoint-40/training_args.bin +1 -1
- checkpoint-50/adapter_config.json +2 -2
- checkpoint-50/adapter_model.safetensors +1 -1
- checkpoint-50/optimizer.pt +1 -1
- checkpoint-50/trainer_state.json +10 -10
- checkpoint-50/training_args.bin +1 -1
- checkpoint-60/adapter_config.json +2 -2
- checkpoint-60/adapter_model.safetensors +1 -1
- checkpoint-60/optimizer.pt +1 -1
- checkpoint-60/trainer_state.json +12 -12
- checkpoint-60/training_args.bin +1 -1
- checkpoint-70/adapter_config.json +2 -2
- checkpoint-70/adapter_model.safetensors +1 -1
- checkpoint-70/optimizer.pt +1 -1
- checkpoint-70/trainer_state.json +14 -14
- checkpoint-70/training_args.bin +1 -1
- checkpoint-72/adapter_config.json +2 -2
- checkpoint-72/adapter_model.safetensors +1 -1
- checkpoint-72/optimizer.pt +1 -1
- checkpoint-72/trainer_state.json +14 -14
- checkpoint-72/training_args.bin +1 -1
adapter_config.json
CHANGED
@@ -20,8 +20,8 @@
|
|
20 |
"rank_pattern": {},
|
21 |
"revision": null,
|
22 |
"target_modules": [
|
23 |
-
"
|
24 |
-
"
|
25 |
],
|
26 |
"task_type": "CAUSAL_LM",
|
27 |
"use_dora": false,
|
|
|
20 |
"rank_pattern": {},
|
21 |
"revision": null,
|
22 |
"target_modules": [
|
23 |
+
"q_proj",
|
24 |
+
"v_proj"
|
25 |
],
|
26 |
"task_type": "CAUSAL_LM",
|
27 |
"use_dora": false,
|
adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 6832600
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:089e9b02962974c75c6049905f2ab2ce48248b37664b9f385cca31095074a258
|
3 |
size 6832600
|
checkpoint-10/adapter_config.json
CHANGED
@@ -20,8 +20,8 @@
|
|
20 |
"rank_pattern": {},
|
21 |
"revision": null,
|
22 |
"target_modules": [
|
23 |
-
"
|
24 |
-
"
|
25 |
],
|
26 |
"task_type": "CAUSAL_LM",
|
27 |
"use_dora": false,
|
|
|
20 |
"rank_pattern": {},
|
21 |
"revision": null,
|
22 |
"target_modules": [
|
23 |
+
"q_proj",
|
24 |
+
"v_proj"
|
25 |
],
|
26 |
"task_type": "CAUSAL_LM",
|
27 |
"use_dora": false,
|
checkpoint-10/adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 6832600
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fb6239c4d573eb2621ff10ad222da14f996c8d2f3390a0d3f7cf6fc3cc303933
|
3 |
size 6832600
|
checkpoint-10/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27338682
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:09d973c62bd97ddb6cba001ce0ce6e8ab3627ab738820551fed79860e1fbe433
|
3 |
size 27338682
|
checkpoint-10/trainer_state.json
CHANGED
@@ -10,9 +10,9 @@
|
|
10 |
"log_history": [
|
11 |
{
|
12 |
"epoch": 0.13745704467353953,
|
13 |
-
"grad_norm": 2.
|
14 |
"learning_rate": 0.0002,
|
15 |
-
"loss": 2.
|
16 |
"step": 10
|
17 |
}
|
18 |
],
|
|
|
10 |
"log_history": [
|
11 |
{
|
12 |
"epoch": 0.13745704467353953,
|
13 |
+
"grad_norm": 2.5390625,
|
14 |
"learning_rate": 0.0002,
|
15 |
+
"loss": 2.5496,
|
16 |
"step": 10
|
17 |
}
|
18 |
],
|
checkpoint-10/training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5304
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:540f901f89791921e9b3cf9ab4587377c091add791e4fe4b6656820764ebd035
|
3 |
size 5304
|
checkpoint-20/adapter_config.json
CHANGED
@@ -20,8 +20,8 @@
|
|
20 |
"rank_pattern": {},
|
21 |
"revision": null,
|
22 |
"target_modules": [
|
23 |
-
"
|
24 |
-
"
|
25 |
],
|
26 |
"task_type": "CAUSAL_LM",
|
27 |
"use_dora": false,
|
|
|
20 |
"rank_pattern": {},
|
21 |
"revision": null,
|
22 |
"target_modules": [
|
23 |
+
"q_proj",
|
24 |
+
"v_proj"
|
25 |
],
|
26 |
"task_type": "CAUSAL_LM",
|
27 |
"use_dora": false,
|
checkpoint-20/adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 6832600
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:df8ec53bf646e3db4650fe8d85776edeeaa740c75069ff07c904891c4a1edf60
|
3 |
size 6832600
|
checkpoint-20/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27338682
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e0cd3d5e3b70abcc506047a384469b16e5ad770b0aafc11942ce45b90071e873
|
3 |
size 27338682
|
checkpoint-20/trainer_state.json
CHANGED
@@ -10,16 +10,16 @@
|
|
10 |
"log_history": [
|
11 |
{
|
12 |
"epoch": 0.13745704467353953,
|
13 |
-
"grad_norm": 2.
|
14 |
"learning_rate": 0.0002,
|
15 |
-
"loss": 2.
|
16 |
"step": 10
|
17 |
},
|
18 |
{
|
19 |
"epoch": 0.27491408934707906,
|
20 |
-
"grad_norm": 1.
|
21 |
"learning_rate": 0.0002,
|
22 |
-
"loss": 1.
|
23 |
"step": 20
|
24 |
}
|
25 |
],
|
|
|
10 |
"log_history": [
|
11 |
{
|
12 |
"epoch": 0.13745704467353953,
|
13 |
+
"grad_norm": 2.5390625,
|
14 |
"learning_rate": 0.0002,
|
15 |
+
"loss": 2.5496,
|
16 |
"step": 10
|
17 |
},
|
18 |
{
|
19 |
"epoch": 0.27491408934707906,
|
20 |
+
"grad_norm": 1.5771484375,
|
21 |
"learning_rate": 0.0002,
|
22 |
+
"loss": 1.1222,
|
23 |
"step": 20
|
24 |
}
|
25 |
],
|
checkpoint-20/training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5304
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:540f901f89791921e9b3cf9ab4587377c091add791e4fe4b6656820764ebd035
|
3 |
size 5304
|
checkpoint-30/adapter_config.json
CHANGED
@@ -20,8 +20,8 @@
|
|
20 |
"rank_pattern": {},
|
21 |
"revision": null,
|
22 |
"target_modules": [
|
23 |
-
"
|
24 |
-
"
|
25 |
],
|
26 |
"task_type": "CAUSAL_LM",
|
27 |
"use_dora": false,
|
|
|
20 |
"rank_pattern": {},
|
21 |
"revision": null,
|
22 |
"target_modules": [
|
23 |
+
"q_proj",
|
24 |
+
"v_proj"
|
25 |
],
|
26 |
"task_type": "CAUSAL_LM",
|
27 |
"use_dora": false,
|
checkpoint-30/adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 6832600
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5bbef078d5c140677a5a69f6fa6864a8f631586a67f0f227afc470387f0dc1f5
|
3 |
size 6832600
|
checkpoint-30/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27338682
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:497b526615ff07addd479c1b072efce207d8c3db3ff2d9bf8dc5d62f66fb72b0
|
3 |
size 27338682
|
checkpoint-30/trainer_state.json
CHANGED
@@ -10,23 +10,23 @@
|
|
10 |
"log_history": [
|
11 |
{
|
12 |
"epoch": 0.13745704467353953,
|
13 |
-
"grad_norm": 2.
|
14 |
"learning_rate": 0.0002,
|
15 |
-
"loss": 2.
|
16 |
"step": 10
|
17 |
},
|
18 |
{
|
19 |
"epoch": 0.27491408934707906,
|
20 |
-
"grad_norm": 1.
|
21 |
"learning_rate": 0.0002,
|
22 |
-
"loss": 1.
|
23 |
"step": 20
|
24 |
},
|
25 |
{
|
26 |
"epoch": 0.41237113402061853,
|
27 |
-
"grad_norm": 0.
|
28 |
"learning_rate": 0.0002,
|
29 |
-
"loss": 0.
|
30 |
"step": 30
|
31 |
}
|
32 |
],
|
|
|
10 |
"log_history": [
|
11 |
{
|
12 |
"epoch": 0.13745704467353953,
|
13 |
+
"grad_norm": 2.5390625,
|
14 |
"learning_rate": 0.0002,
|
15 |
+
"loss": 2.5496,
|
16 |
"step": 10
|
17 |
},
|
18 |
{
|
19 |
"epoch": 0.27491408934707906,
|
20 |
+
"grad_norm": 1.5771484375,
|
21 |
"learning_rate": 0.0002,
|
22 |
+
"loss": 1.1222,
|
23 |
"step": 20
|
24 |
},
|
25 |
{
|
26 |
"epoch": 0.41237113402061853,
|
27 |
+
"grad_norm": 0.66748046875,
|
28 |
"learning_rate": 0.0002,
|
29 |
+
"loss": 0.5563,
|
30 |
"step": 30
|
31 |
}
|
32 |
],
|
checkpoint-30/training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5304
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:540f901f89791921e9b3cf9ab4587377c091add791e4fe4b6656820764ebd035
|
3 |
size 5304
|
checkpoint-40/adapter_config.json
CHANGED
@@ -20,8 +20,8 @@
|
|
20 |
"rank_pattern": {},
|
21 |
"revision": null,
|
22 |
"target_modules": [
|
23 |
-
"
|
24 |
-
"
|
25 |
],
|
26 |
"task_type": "CAUSAL_LM",
|
27 |
"use_dora": false,
|
|
|
20 |
"rank_pattern": {},
|
21 |
"revision": null,
|
22 |
"target_modules": [
|
23 |
+
"q_proj",
|
24 |
+
"v_proj"
|
25 |
],
|
26 |
"task_type": "CAUSAL_LM",
|
27 |
"use_dora": false,
|
checkpoint-40/adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 6832600
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8ee136b35ecab263229c2a5cc09588a2b068195ab08b4f35eb04aee51785dd1d
|
3 |
size 6832600
|
checkpoint-40/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27338682
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f1f6ce72b6125275a965c4c78490086feb151bf209fb9bcec0f10991bedb30c1
|
3 |
size 27338682
|
checkpoint-40/trainer_state.json
CHANGED
@@ -10,30 +10,30 @@
|
|
10 |
"log_history": [
|
11 |
{
|
12 |
"epoch": 0.13745704467353953,
|
13 |
-
"grad_norm": 2.
|
14 |
"learning_rate": 0.0002,
|
15 |
-
"loss": 2.
|
16 |
"step": 10
|
17 |
},
|
18 |
{
|
19 |
"epoch": 0.27491408934707906,
|
20 |
-
"grad_norm": 1.
|
21 |
"learning_rate": 0.0002,
|
22 |
-
"loss": 1.
|
23 |
"step": 20
|
24 |
},
|
25 |
{
|
26 |
"epoch": 0.41237113402061853,
|
27 |
-
"grad_norm": 0.
|
28 |
"learning_rate": 0.0002,
|
29 |
-
"loss": 0.
|
30 |
"step": 30
|
31 |
},
|
32 |
{
|
33 |
"epoch": 0.5498281786941581,
|
34 |
-
"grad_norm": 0.
|
35 |
"learning_rate": 0.0002,
|
36 |
-
"loss": 0.
|
37 |
"step": 40
|
38 |
}
|
39 |
],
|
|
|
10 |
"log_history": [
|
11 |
{
|
12 |
"epoch": 0.13745704467353953,
|
13 |
+
"grad_norm": 2.5390625,
|
14 |
"learning_rate": 0.0002,
|
15 |
+
"loss": 2.5496,
|
16 |
"step": 10
|
17 |
},
|
18 |
{
|
19 |
"epoch": 0.27491408934707906,
|
20 |
+
"grad_norm": 1.5771484375,
|
21 |
"learning_rate": 0.0002,
|
22 |
+
"loss": 1.1222,
|
23 |
"step": 20
|
24 |
},
|
25 |
{
|
26 |
"epoch": 0.41237113402061853,
|
27 |
+
"grad_norm": 0.66748046875,
|
28 |
"learning_rate": 0.0002,
|
29 |
+
"loss": 0.5563,
|
30 |
"step": 30
|
31 |
},
|
32 |
{
|
33 |
"epoch": 0.5498281786941581,
|
34 |
+
"grad_norm": 0.6455078125,
|
35 |
"learning_rate": 0.0002,
|
36 |
+
"loss": 0.5064,
|
37 |
"step": 40
|
38 |
}
|
39 |
],
|
checkpoint-40/training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5304
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:540f901f89791921e9b3cf9ab4587377c091add791e4fe4b6656820764ebd035
|
3 |
size 5304
|
checkpoint-50/adapter_config.json
CHANGED
@@ -20,8 +20,8 @@
|
|
20 |
"rank_pattern": {},
|
21 |
"revision": null,
|
22 |
"target_modules": [
|
23 |
-
"
|
24 |
-
"
|
25 |
],
|
26 |
"task_type": "CAUSAL_LM",
|
27 |
"use_dora": false,
|
|
|
20 |
"rank_pattern": {},
|
21 |
"revision": null,
|
22 |
"target_modules": [
|
23 |
+
"q_proj",
|
24 |
+
"v_proj"
|
25 |
],
|
26 |
"task_type": "CAUSAL_LM",
|
27 |
"use_dora": false,
|
checkpoint-50/adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 6832600
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0cb9a4e2b8ffc1bbde07b3cc8314ca0f3451a017154b8438581e6289557d03bc
|
3 |
size 6832600
|
checkpoint-50/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27338682
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:88990edb9dc7bf5ed1ed1ca9f5cfef074535755129f1547e954f359832c42436
|
3 |
size 27338682
|
checkpoint-50/trainer_state.json
CHANGED
@@ -10,37 +10,37 @@
|
|
10 |
"log_history": [
|
11 |
{
|
12 |
"epoch": 0.13745704467353953,
|
13 |
-
"grad_norm": 2.
|
14 |
"learning_rate": 0.0002,
|
15 |
-
"loss": 2.
|
16 |
"step": 10
|
17 |
},
|
18 |
{
|
19 |
"epoch": 0.27491408934707906,
|
20 |
-
"grad_norm": 1.
|
21 |
"learning_rate": 0.0002,
|
22 |
-
"loss": 1.
|
23 |
"step": 20
|
24 |
},
|
25 |
{
|
26 |
"epoch": 0.41237113402061853,
|
27 |
-
"grad_norm": 0.
|
28 |
"learning_rate": 0.0002,
|
29 |
-
"loss": 0.
|
30 |
"step": 30
|
31 |
},
|
32 |
{
|
33 |
"epoch": 0.5498281786941581,
|
34 |
-
"grad_norm": 0.
|
35 |
"learning_rate": 0.0002,
|
36 |
-
"loss": 0.
|
37 |
"step": 40
|
38 |
},
|
39 |
{
|
40 |
"epoch": 0.6872852233676976,
|
41 |
-
"grad_norm": 0.
|
42 |
"learning_rate": 0.0002,
|
43 |
-
"loss": 0.
|
44 |
"step": 50
|
45 |
}
|
46 |
],
|
|
|
10 |
"log_history": [
|
11 |
{
|
12 |
"epoch": 0.13745704467353953,
|
13 |
+
"grad_norm": 2.5390625,
|
14 |
"learning_rate": 0.0002,
|
15 |
+
"loss": 2.5496,
|
16 |
"step": 10
|
17 |
},
|
18 |
{
|
19 |
"epoch": 0.27491408934707906,
|
20 |
+
"grad_norm": 1.5771484375,
|
21 |
"learning_rate": 0.0002,
|
22 |
+
"loss": 1.1222,
|
23 |
"step": 20
|
24 |
},
|
25 |
{
|
26 |
"epoch": 0.41237113402061853,
|
27 |
+
"grad_norm": 0.66748046875,
|
28 |
"learning_rate": 0.0002,
|
29 |
+
"loss": 0.5563,
|
30 |
"step": 30
|
31 |
},
|
32 |
{
|
33 |
"epoch": 0.5498281786941581,
|
34 |
+
"grad_norm": 0.6455078125,
|
35 |
"learning_rate": 0.0002,
|
36 |
+
"loss": 0.5064,
|
37 |
"step": 40
|
38 |
},
|
39 |
{
|
40 |
"epoch": 0.6872852233676976,
|
41 |
+
"grad_norm": 0.62451171875,
|
42 |
"learning_rate": 0.0002,
|
43 |
+
"loss": 0.4592,
|
44 |
"step": 50
|
45 |
}
|
46 |
],
|
checkpoint-50/training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5304
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:540f901f89791921e9b3cf9ab4587377c091add791e4fe4b6656820764ebd035
|
3 |
size 5304
|
checkpoint-60/adapter_config.json
CHANGED
@@ -20,8 +20,8 @@
|
|
20 |
"rank_pattern": {},
|
21 |
"revision": null,
|
22 |
"target_modules": [
|
23 |
-
"
|
24 |
-
"
|
25 |
],
|
26 |
"task_type": "CAUSAL_LM",
|
27 |
"use_dora": false,
|
|
|
20 |
"rank_pattern": {},
|
21 |
"revision": null,
|
22 |
"target_modules": [
|
23 |
+
"q_proj",
|
24 |
+
"v_proj"
|
25 |
],
|
26 |
"task_type": "CAUSAL_LM",
|
27 |
"use_dora": false,
|
checkpoint-60/adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 6832600
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2d3da5b893f53b71e42667360590d0303a5cabec2b19c4680677d3ba2fe6fa2b
|
3 |
size 6832600
|
checkpoint-60/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27338682
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aa9325ece40d56ecf5c322ed8294ea76437847de82c3847b4fdebe3aeb5c401c
|
3 |
size 27338682
|
checkpoint-60/trainer_state.json
CHANGED
@@ -10,44 +10,44 @@
|
|
10 |
"log_history": [
|
11 |
{
|
12 |
"epoch": 0.13745704467353953,
|
13 |
-
"grad_norm": 2.
|
14 |
"learning_rate": 0.0002,
|
15 |
-
"loss": 2.
|
16 |
"step": 10
|
17 |
},
|
18 |
{
|
19 |
"epoch": 0.27491408934707906,
|
20 |
-
"grad_norm": 1.
|
21 |
"learning_rate": 0.0002,
|
22 |
-
"loss": 1.
|
23 |
"step": 20
|
24 |
},
|
25 |
{
|
26 |
"epoch": 0.41237113402061853,
|
27 |
-
"grad_norm": 0.
|
28 |
"learning_rate": 0.0002,
|
29 |
-
"loss": 0.
|
30 |
"step": 30
|
31 |
},
|
32 |
{
|
33 |
"epoch": 0.5498281786941581,
|
34 |
-
"grad_norm": 0.
|
35 |
"learning_rate": 0.0002,
|
36 |
-
"loss": 0.
|
37 |
"step": 40
|
38 |
},
|
39 |
{
|
40 |
"epoch": 0.6872852233676976,
|
41 |
-
"grad_norm": 0.
|
42 |
"learning_rate": 0.0002,
|
43 |
-
"loss": 0.
|
44 |
"step": 50
|
45 |
},
|
46 |
{
|
47 |
"epoch": 0.8247422680412371,
|
48 |
-
"grad_norm": 0.
|
49 |
"learning_rate": 0.0002,
|
50 |
-
"loss": 0.
|
51 |
"step": 60
|
52 |
}
|
53 |
],
|
|
|
10 |
"log_history": [
|
11 |
{
|
12 |
"epoch": 0.13745704467353953,
|
13 |
+
"grad_norm": 2.5390625,
|
14 |
"learning_rate": 0.0002,
|
15 |
+
"loss": 2.5496,
|
16 |
"step": 10
|
17 |
},
|
18 |
{
|
19 |
"epoch": 0.27491408934707906,
|
20 |
+
"grad_norm": 1.5771484375,
|
21 |
"learning_rate": 0.0002,
|
22 |
+
"loss": 1.1222,
|
23 |
"step": 20
|
24 |
},
|
25 |
{
|
26 |
"epoch": 0.41237113402061853,
|
27 |
+
"grad_norm": 0.66748046875,
|
28 |
"learning_rate": 0.0002,
|
29 |
+
"loss": 0.5563,
|
30 |
"step": 30
|
31 |
},
|
32 |
{
|
33 |
"epoch": 0.5498281786941581,
|
34 |
+
"grad_norm": 0.6455078125,
|
35 |
"learning_rate": 0.0002,
|
36 |
+
"loss": 0.5064,
|
37 |
"step": 40
|
38 |
},
|
39 |
{
|
40 |
"epoch": 0.6872852233676976,
|
41 |
+
"grad_norm": 0.62451171875,
|
42 |
"learning_rate": 0.0002,
|
43 |
+
"loss": 0.4592,
|
44 |
"step": 50
|
45 |
},
|
46 |
{
|
47 |
"epoch": 0.8247422680412371,
|
48 |
+
"grad_norm": 0.62939453125,
|
49 |
"learning_rate": 0.0002,
|
50 |
+
"loss": 0.4184,
|
51 |
"step": 60
|
52 |
}
|
53 |
],
|
checkpoint-60/training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5304
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:540f901f89791921e9b3cf9ab4587377c091add791e4fe4b6656820764ebd035
|
3 |
size 5304
|
checkpoint-70/adapter_config.json
CHANGED
@@ -20,8 +20,8 @@
|
|
20 |
"rank_pattern": {},
|
21 |
"revision": null,
|
22 |
"target_modules": [
|
23 |
-
"
|
24 |
-
"
|
25 |
],
|
26 |
"task_type": "CAUSAL_LM",
|
27 |
"use_dora": false,
|
|
|
20 |
"rank_pattern": {},
|
21 |
"revision": null,
|
22 |
"target_modules": [
|
23 |
+
"q_proj",
|
24 |
+
"v_proj"
|
25 |
],
|
26 |
"task_type": "CAUSAL_LM",
|
27 |
"use_dora": false,
|
checkpoint-70/adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 6832600
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f04ffcdee92618373bf9bb9a11fcb0cdb11e80c344985c230fd759bc5ed2a2d1
|
3 |
size 6832600
|
checkpoint-70/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27338682
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c6485ad76d93d84ff54754fe6959052cbc580e340870978fff592572009a405b
|
3 |
size 27338682
|
checkpoint-70/trainer_state.json
CHANGED
@@ -10,51 +10,51 @@
|
|
10 |
"log_history": [
|
11 |
{
|
12 |
"epoch": 0.13745704467353953,
|
13 |
-
"grad_norm": 2.
|
14 |
"learning_rate": 0.0002,
|
15 |
-
"loss": 2.
|
16 |
"step": 10
|
17 |
},
|
18 |
{
|
19 |
"epoch": 0.27491408934707906,
|
20 |
-
"grad_norm": 1.
|
21 |
"learning_rate": 0.0002,
|
22 |
-
"loss": 1.
|
23 |
"step": 20
|
24 |
},
|
25 |
{
|
26 |
"epoch": 0.41237113402061853,
|
27 |
-
"grad_norm": 0.
|
28 |
"learning_rate": 0.0002,
|
29 |
-
"loss": 0.
|
30 |
"step": 30
|
31 |
},
|
32 |
{
|
33 |
"epoch": 0.5498281786941581,
|
34 |
-
"grad_norm": 0.
|
35 |
"learning_rate": 0.0002,
|
36 |
-
"loss": 0.
|
37 |
"step": 40
|
38 |
},
|
39 |
{
|
40 |
"epoch": 0.6872852233676976,
|
41 |
-
"grad_norm": 0.
|
42 |
"learning_rate": 0.0002,
|
43 |
-
"loss": 0.
|
44 |
"step": 50
|
45 |
},
|
46 |
{
|
47 |
"epoch": 0.8247422680412371,
|
48 |
-
"grad_norm": 0.
|
49 |
"learning_rate": 0.0002,
|
50 |
-
"loss": 0.
|
51 |
"step": 60
|
52 |
},
|
53 |
{
|
54 |
"epoch": 0.9621993127147767,
|
55 |
-
"grad_norm": 0.
|
56 |
"learning_rate": 0.0002,
|
57 |
-
"loss": 0.
|
58 |
"step": 70
|
59 |
}
|
60 |
],
|
|
|
10 |
"log_history": [
|
11 |
{
|
12 |
"epoch": 0.13745704467353953,
|
13 |
+
"grad_norm": 2.5390625,
|
14 |
"learning_rate": 0.0002,
|
15 |
+
"loss": 2.5496,
|
16 |
"step": 10
|
17 |
},
|
18 |
{
|
19 |
"epoch": 0.27491408934707906,
|
20 |
+
"grad_norm": 1.5771484375,
|
21 |
"learning_rate": 0.0002,
|
22 |
+
"loss": 1.1222,
|
23 |
"step": 20
|
24 |
},
|
25 |
{
|
26 |
"epoch": 0.41237113402061853,
|
27 |
+
"grad_norm": 0.66748046875,
|
28 |
"learning_rate": 0.0002,
|
29 |
+
"loss": 0.5563,
|
30 |
"step": 30
|
31 |
},
|
32 |
{
|
33 |
"epoch": 0.5498281786941581,
|
34 |
+
"grad_norm": 0.6455078125,
|
35 |
"learning_rate": 0.0002,
|
36 |
+
"loss": 0.5064,
|
37 |
"step": 40
|
38 |
},
|
39 |
{
|
40 |
"epoch": 0.6872852233676976,
|
41 |
+
"grad_norm": 0.62451171875,
|
42 |
"learning_rate": 0.0002,
|
43 |
+
"loss": 0.4592,
|
44 |
"step": 50
|
45 |
},
|
46 |
{
|
47 |
"epoch": 0.8247422680412371,
|
48 |
+
"grad_norm": 0.62939453125,
|
49 |
"learning_rate": 0.0002,
|
50 |
+
"loss": 0.4184,
|
51 |
"step": 60
|
52 |
},
|
53 |
{
|
54 |
"epoch": 0.9621993127147767,
|
55 |
+
"grad_norm": 0.576171875,
|
56 |
"learning_rate": 0.0002,
|
57 |
+
"loss": 0.4028,
|
58 |
"step": 70
|
59 |
}
|
60 |
],
|
checkpoint-70/training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5304
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:540f901f89791921e9b3cf9ab4587377c091add791e4fe4b6656820764ebd035
|
3 |
size 5304
|
checkpoint-72/adapter_config.json
CHANGED
@@ -20,8 +20,8 @@
|
|
20 |
"rank_pattern": {},
|
21 |
"revision": null,
|
22 |
"target_modules": [
|
23 |
-
"
|
24 |
-
"
|
25 |
],
|
26 |
"task_type": "CAUSAL_LM",
|
27 |
"use_dora": false,
|
|
|
20 |
"rank_pattern": {},
|
21 |
"revision": null,
|
22 |
"target_modules": [
|
23 |
+
"q_proj",
|
24 |
+
"v_proj"
|
25 |
],
|
26 |
"task_type": "CAUSAL_LM",
|
27 |
"use_dora": false,
|
checkpoint-72/adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 6832600
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:089e9b02962974c75c6049905f2ab2ce48248b37664b9f385cca31095074a258
|
3 |
size 6832600
|
checkpoint-72/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27338682
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cd63f16da461c601f3eb92aca1b749245db35b4cb28b7cdd759e8ca918c0566d
|
3 |
size 27338682
|
checkpoint-72/trainer_state.json
CHANGED
@@ -10,51 +10,51 @@
|
|
10 |
"log_history": [
|
11 |
{
|
12 |
"epoch": 0.13745704467353953,
|
13 |
-
"grad_norm": 2.
|
14 |
"learning_rate": 0.0002,
|
15 |
-
"loss": 2.
|
16 |
"step": 10
|
17 |
},
|
18 |
{
|
19 |
"epoch": 0.27491408934707906,
|
20 |
-
"grad_norm": 1.
|
21 |
"learning_rate": 0.0002,
|
22 |
-
"loss": 1.
|
23 |
"step": 20
|
24 |
},
|
25 |
{
|
26 |
"epoch": 0.41237113402061853,
|
27 |
-
"grad_norm": 0.
|
28 |
"learning_rate": 0.0002,
|
29 |
-
"loss": 0.
|
30 |
"step": 30
|
31 |
},
|
32 |
{
|
33 |
"epoch": 0.5498281786941581,
|
34 |
-
"grad_norm": 0.
|
35 |
"learning_rate": 0.0002,
|
36 |
-
"loss": 0.
|
37 |
"step": 40
|
38 |
},
|
39 |
{
|
40 |
"epoch": 0.6872852233676976,
|
41 |
-
"grad_norm": 0.
|
42 |
"learning_rate": 0.0002,
|
43 |
-
"loss": 0.
|
44 |
"step": 50
|
45 |
},
|
46 |
{
|
47 |
"epoch": 0.8247422680412371,
|
48 |
-
"grad_norm": 0.
|
49 |
"learning_rate": 0.0002,
|
50 |
-
"loss": 0.
|
51 |
"step": 60
|
52 |
},
|
53 |
{
|
54 |
"epoch": 0.9621993127147767,
|
55 |
-
"grad_norm": 0.
|
56 |
"learning_rate": 0.0002,
|
57 |
-
"loss": 0.
|
58 |
"step": 70
|
59 |
}
|
60 |
],
|
|
|
10 |
"log_history": [
|
11 |
{
|
12 |
"epoch": 0.13745704467353953,
|
13 |
+
"grad_norm": 2.5390625,
|
14 |
"learning_rate": 0.0002,
|
15 |
+
"loss": 2.5496,
|
16 |
"step": 10
|
17 |
},
|
18 |
{
|
19 |
"epoch": 0.27491408934707906,
|
20 |
+
"grad_norm": 1.5771484375,
|
21 |
"learning_rate": 0.0002,
|
22 |
+
"loss": 1.1222,
|
23 |
"step": 20
|
24 |
},
|
25 |
{
|
26 |
"epoch": 0.41237113402061853,
|
27 |
+
"grad_norm": 0.66748046875,
|
28 |
"learning_rate": 0.0002,
|
29 |
+
"loss": 0.5563,
|
30 |
"step": 30
|
31 |
},
|
32 |
{
|
33 |
"epoch": 0.5498281786941581,
|
34 |
+
"grad_norm": 0.6455078125,
|
35 |
"learning_rate": 0.0002,
|
36 |
+
"loss": 0.5064,
|
37 |
"step": 40
|
38 |
},
|
39 |
{
|
40 |
"epoch": 0.6872852233676976,
|
41 |
+
"grad_norm": 0.62451171875,
|
42 |
"learning_rate": 0.0002,
|
43 |
+
"loss": 0.4592,
|
44 |
"step": 50
|
45 |
},
|
46 |
{
|
47 |
"epoch": 0.8247422680412371,
|
48 |
+
"grad_norm": 0.62939453125,
|
49 |
"learning_rate": 0.0002,
|
50 |
+
"loss": 0.4184,
|
51 |
"step": 60
|
52 |
},
|
53 |
{
|
54 |
"epoch": 0.9621993127147767,
|
55 |
+
"grad_norm": 0.576171875,
|
56 |
"learning_rate": 0.0002,
|
57 |
+
"loss": 0.4028,
|
58 |
"step": 70
|
59 |
}
|
60 |
],
|
checkpoint-72/training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5304
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:540f901f89791921e9b3cf9ab4587377c091add791e4fe4b6656820764ebd035
|
3 |
size 5304
|