HachiML committed on
Commit
d5d6f0a
·
verified ·
1 Parent(s): 16275bf

Upload 9 files

Browse files
benchmark_scores/result_jaqket_v2-0.2-0.2.json ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "results": {
3
+ "jaqket_v2-0.2-0.2": {
4
+ "exact_match": 80.58419243986255,
5
+ "f1": 84.86990863279517
6
+ }
7
+ },
8
+ "versions": {
9
+ "jaqket_v2-0.2-0.2": 0.2
10
+ },
11
+ "config": {
12
+ "model": "hf-causal-experimental",
13
+ "model_args": "pretrained=HachiML/youri-2x7b_v0.2,tokenizer=HachiML/youri-2x7b_v0.2,use_accelerate=True,dtype=auto",
14
+ "num_fewshot": [
15
+ 1
16
+ ],
17
+ "batch_size": 2,
18
+ "device": "cuda",
19
+ "no_cache": false,
20
+ "limit": null,
21
+ "bootstrap_iters": 100000,
22
+ "description_dict": null
23
+ }
24
+ }
benchmark_scores/result_jcola.json ADDED
@@ -0,0 +1,26 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "results": {
3
+ "jcola": {
4
+ "balanced_acc": 0.5841310422736191,
5
+ "mcc": 0.13714598200194028,
6
+ "mcc_stderr": 0.03691630655102646,
7
+ "macro_f1": 0.5548345406141655
8
+ }
9
+ },
10
+ "versions": {
11
+ "jcola": 0.2
12
+ },
13
+ "config": {
14
+ "model": "hf-causal-experimental",
15
+ "model_args": "pretrained=HachiML/youri-2x7b_v0.2,tokenizer=HachiML/youri-2x7b_v0.2,use_accelerate=True,dtype=auto",
16
+ "num_fewshot": [
17
+ 5
18
+ ],
19
+ "batch_size": 2,
20
+ "device": "cuda",
21
+ "no_cache": false,
22
+ "limit": null,
23
+ "bootstrap_iters": 100000,
24
+ "description_dict": null
25
+ }
26
+ }
benchmark_scores/result_jcommonsenseqa-1.1-0.2.1.json ADDED
@@ -0,0 +1,26 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "results": {
3
+ "jcommonsenseqa-1.1-0.2.1": {
4
+ "acc": 0.9097408400357462,
5
+ "acc_stderr": 0.008570054575466593,
6
+ "acc_norm": 0.8302055406613047,
7
+ "acc_norm_stderr": 0.011228808341801134
8
+ }
9
+ },
10
+ "versions": {
11
+ "jcommonsenseqa-1.1-0.2.1": 1.1
12
+ },
13
+ "config": {
14
+ "model": "hf-causal-experimental",
15
+ "model_args": "pretrained=HachiML/youri-2x7b_v0.2,tokenizer=HachiML/youri-2x7b_v0.2,use_accelerate=True,dtype=auto",
16
+ "num_fewshot": [
17
+ 3
18
+ ],
19
+ "batch_size": 1,
20
+ "device": "cuda",
21
+ "no_cache": false,
22
+ "limit": null,
23
+ "bootstrap_iters": 100000,
24
+ "description_dict": null
25
+ }
26
+ }
benchmark_scores/result_jnli-1.3-0.2.json ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "results": {
3
+ "jnli-1.3-0.2": {
4
+ "acc": 0.5875102711585867,
5
+ "acc_stderr": 0.009980291973884942,
6
+ "acc_norm": 0.5875102711585867,
7
+ "acc_norm_stderr": 0.009980291973884942,
8
+ "balanced_acc": 0.7118954352211451,
9
+ "mcc": 0.48341356747473024,
10
+ "mcc_stderr": 0.011948217496149275,
11
+ "macro_f1": 0.601774322498386
12
+ }
13
+ },
14
+ "versions": {
15
+ "jnli-1.3-0.2": 1.3
16
+ },
17
+ "config": {
18
+ "model": "hf-causal-experimental",
19
+ "model_args": "pretrained=HachiML/youri-2x7b_v0.2,tokenizer=HachiML/youri-2x7b_v0.2,use_accelerate=True,dtype=auto",
20
+ "num_fewshot": [
21
+ 3
22
+ ],
23
+ "batch_size": 8,
24
+ "device": "cuda",
25
+ "no_cache": false,
26
+ "limit": null,
27
+ "bootstrap_iters": 100000,
28
+ "description_dict": null
29
+ }
30
+ }
benchmark_scores/result_jsquad-1.2-0.2.json ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "results": {
3
+ "jsquad-1.2-0.2": {
4
+ "exact_match": 80.14407924358397,
5
+ "f1": 91.31291346456423
6
+ }
7
+ },
8
+ "versions": {
9
+ "jsquad-1.2-0.2": 1.2
10
+ },
11
+ "config": {
12
+ "model": "hf-causal-experimental",
13
+ "model_args": "pretrained=HachiML/youri-2x7b_v0.2,tokenizer=HachiML/youri-2x7b_v0.2,use_accelerate=True,dtype=auto",
14
+ "num_fewshot": [
15
+ 2
16
+ ],
17
+ "batch_size": 1,
18
+ "device": "cuda",
19
+ "no_cache": false,
20
+ "limit": null,
21
+ "bootstrap_iters": 100000,
22
+ "description_dict": null
23
+ }
24
+ }
benchmark_scores/result_marc_ja-1.1-0.2.json ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "results": {
3
+ "marc_ja-1.1-0.2": {
4
+ "acc": 0.9757693668199505,
5
+ "acc_stderr": 0.002045109088212568,
6
+ "acc_norm": 0.9757693668199505,
7
+ "acc_norm_stderr": 0.002045109088212568,
8
+ "balanced_acc": 0.9595742998823737,
9
+ "mcc": 0.9043294397096614,
10
+ "mcc_stderr": 0.00802664025288833,
11
+ "macro_f1": 0.9520408004687209
12
+ }
13
+ },
14
+ "versions": {
15
+ "marc_ja-1.1-0.2": 1.1
16
+ },
17
+ "config": {
18
+ "model": "hf-causal-experimental",
19
+ "model_args": "pretrained=HachiML/youri-2x7b_v0.2,tokenizer=HachiML/youri-2x7b_v0.2,use_accelerate=True,dtype=auto",
20
+ "num_fewshot": [
21
+ 0
22
+ ],
23
+ "batch_size": 2,
24
+ "device": "cuda",
25
+ "no_cache": false,
26
+ "limit": null,
27
+ "bootstrap_iters": 100000,
28
+ "description_dict": null
29
+ }
30
+ }
benchmark_scores/result_mgsm.json ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "results": {
3
+ "mgsm": {
4
+ "acc": 0.232,
5
+ "acc_stderr": 0.026750070374865167
6
+ }
7
+ },
8
+ "versions": {
9
+ "mgsm": 1.0
10
+ },
11
+ "config": {
12
+ "model": "hf-causal-experimental",
13
+ "model_args": "pretrained=HachiML/youri-2x7b_v0.2,tokenizer=HachiML/youri-2x7b_v0.2,use_accelerate=True,dtype=auto",
14
+ "num_fewshot": [
15
+ 5
16
+ ],
17
+ "batch_size": 2,
18
+ "device": "cuda",
19
+ "no_cache": false,
20
+ "limit": null,
21
+ "bootstrap_iters": 100000,
22
+ "description_dict": null
23
+ }
24
+ }
benchmark_scores/result_xlsum_ja.json ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "results": {
3
+ "xlsum_ja": {
4
+ "rouge2": 25.447876004263104
5
+ }
6
+ },
7
+ "versions": {
8
+ "xlsum_ja": 1.0
9
+ },
10
+ "config": {
11
+ "model": "hf-causal-experimental",
12
+ "model_args": "pretrained=HachiML/youri-2x7b_v0.2,tokenizer=HachiML/youri-2x7b_v0.2,use_accelerate=True,dtype=auto",
13
+ "num_fewshot": [
14
+ 1
15
+ ],
16
+ "batch_size": 2,
17
+ "device": "cuda",
18
+ "no_cache": false,
19
+ "limit": null,
20
+ "bootstrap_iters": 100000,
21
+ "description_dict": null
22
+ }
23
+ }
benchmark_scores/result_xwinograd_ja.json ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "results": {
3
+ "xwinograd_ja": {
4
+ "acc": 0.8143899895724713,
5
+ "acc_stderr": 0.012561287517973916
6
+ }
7
+ },
8
+ "versions": {
9
+ "xwinograd_ja": 1.0
10
+ },
11
+ "config": {
12
+ "model": "hf-causal-experimental",
13
+ "model_args": "pretrained=HachiML/youri-2x7b_v0.2,tokenizer=HachiML/youri-2x7b_v0.2,use_accelerate=True,dtype=auto",
14
+ "num_fewshot": [
15
+ 0
16
+ ],
17
+ "batch_size": 2,
18
+ "device": "cuda",
19
+ "no_cache": false,
20
+ "limit": null,
21
+ "bootstrap_iters": 100000,
22
+ "description_dict": null
23
+ }
24
+ }