JaviManobanda committed on
Commit
37fae62
·
verified ·
1 Parent(s): 09ad404

End of training

Browse files
README.md CHANGED
@@ -17,9 +17,9 @@ should probably proofread and complete it, then remove this comment. -->
17
 
18
  This model is a fine-tuned version of [google/flan-t5-small](https://huggingface.co/google/flan-t5-small) on the None dataset.
19
  It achieves the following results on the evaluation set:
20
- - Loss: 0.0247
21
- - F1: 97.2892
22
- - Gen Len: 7.6006
23
 
24
  ## Model description
25
 
@@ -44,15 +44,19 @@ The following hyperparameters were used during training:
44
  - seed: 42
45
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
46
  - lr_scheduler_type: linear
47
- - num_epochs: 10
48
 
49
  ### Training results
50
 
 
 
 
 
51
 
52
 
53
  ### Framework versions
54
 
55
  - Transformers 4.44.0
56
  - Pytorch 2.4.0
57
- - Datasets 3.0.1
58
  - Tokenizers 0.19.1
 
17
 
18
  This model is a fine-tuned version of [google/flan-t5-small](https://huggingface.co/google/flan-t5-small) on the None dataset.
19
  It achieves the following results on the evaluation set:
20
+ - Loss: 0.0423
21
+ - F1: 97.5301
22
+ - Gen Len: 2.6047
23
 
24
  ## Model description
25
 
 
44
  - seed: 42
45
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
46
  - lr_scheduler_type: linear
47
+ - num_epochs: 2
48
 
49
  ### Training results
50
 
51
+ | Training Loss | Epoch | Step | Validation Loss | F1 | Gen Len |
52
+ |:-------------:|:-----:|:----:|:---------------:|:-------:|:-------:|
53
+ | 0.0893 | 1.0 | 1385 | 0.0434 | 96.3938 | 2.6218 |
54
+ | 0.0324 | 2.0 | 2770 | 0.0423 | 97.5301 | 2.6047 |
55
 
56
 
57
  ### Framework versions
58
 
59
  - Transformers 4.44.0
60
  - Pytorch 2.4.0
61
+ - Datasets 3.1.0
62
  - Tokenizers 0.19.1
logs/events.out.tfevents.1734432976.c5d1fc1ff2cc.23.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2fd3f1f1c4944dd361ce414961500ed1ce24dd70d488666708a6098c321de720
3
+ size 456
tokenizer.json CHANGED
@@ -2,13 +2,13 @@
2
  "version": "1.0",
3
  "truncation": {
4
  "direction": "Right",
5
- "max_length": 8,
6
  "strategy": "LongestFirst",
7
  "stride": 0
8
  },
9
  "padding": {
10
  "strategy": {
11
- "Fixed": 8
12
  },
13
  "direction": "Right",
14
  "pad_to_multiple_of": null,
 
2
  "version": "1.0",
3
  "truncation": {
4
  "direction": "Right",
5
+ "max_length": 3,
6
  "strategy": "LongestFirst",
7
  "stride": 0
8
  },
9
  "padding": {
10
  "strategy": {
11
+ "Fixed": 3
12
  },
13
  "direction": "Right",
14
  "pad_to_multiple_of": null,
tokenizer_config.json CHANGED
@@ -927,7 +927,7 @@
927
  "<extra_id_98>",
928
  "<extra_id_99>"
929
  ],
930
- "clean_up_tokenization_spaces": false,
931
  "eos_token": "</s>",
932
  "extra_ids": 100,
933
  "model_max_length": 512,
 
927
  "<extra_id_98>",
928
  "<extra_id_99>"
929
  ],
930
+ "clean_up_tokenization_spaces": true,
931
  "eos_token": "</s>",
932
  "extra_ids": 100,
933
  "model_max_length": 512,