AlekseyKorshuk committed on
Commit
b15a379
·
1 Parent(s): 854e925

huggingartists

Browse files
README.md CHANGED
@@ -45,15 +45,15 @@ from datasets import load_dataset
45
  dataset = load_dataset("huggingartists/cardi-b")
46
  ```
47
 
48
- [Explore the data](https://wandb.ai/huggingartists/huggingartists/runs/gyop804e/artifacts), which is tracked with [W&B artifacts](https://docs.wandb.com/artifacts) at every step of the pipeline.
49
 
50
  ## Training procedure
51
 
52
  The model is based on a pre-trained [GPT-2](https://huggingface.co/gpt2) which is fine-tuned on Cardi B's lyrics.
53
 
54
- Hyperparameters and metrics are recorded in the [W&B training run](https://wandb.ai/huggingartists/huggingartists/runs/2ls1zza7) for full transparency and reproducibility.
55
 
56
- At the end of training, [the final model](https://wandb.ai/huggingartists/huggingartists/runs/2ls1zza7/artifacts) is logged and versioned.
57
 
58
  ## How to use
59
 
 
45
  dataset = load_dataset("huggingartists/cardi-b")
46
  ```
47
 
48
+ [Explore the data](https://wandb.ai/huggingartists/huggingartists/runs/2794795e/artifacts), which is tracked with [W&B artifacts](https://docs.wandb.com/artifacts) at every step of the pipeline.
49
 
50
  ## Training procedure
51
 
52
  The model is based on a pre-trained [GPT-2](https://huggingface.co/gpt2) which is fine-tuned on Cardi B's lyrics.
53
 
54
+ Hyperparameters and metrics are recorded in the [W&B training run](https://wandb.ai/huggingartists/huggingartists/runs/1buiv5nf) for full transparency and reproducibility.
55
 
56
+ At the end of training, [the final model](https://wandb.ai/huggingartists/huggingartists/runs/1buiv5nf/artifacts) is logged and versioned.
57
 
58
  ## How to use
59
 
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "gpt2",
3
  "activation_function": "gelu_new",
4
  "architectures": [
5
  "GPT2LMHeadModel"
@@ -35,7 +35,7 @@
35
  }
36
  },
37
  "torch_dtype": "float32",
38
- "transformers_version": "4.10.2",
39
  "use_cache": true,
40
  "vocab_size": 50257
41
  }
 
1
  {
2
+ "_name_or_path": "huggingartists/cardi-b",
3
  "activation_function": "gelu_new",
4
  "architectures": [
5
  "GPT2LMHeadModel"
 
35
  }
36
  },
37
  "torch_dtype": "float32",
38
+ "transformers_version": "4.10.3",
39
  "use_cache": true,
40
  "vocab_size": 50257
41
  }
evaluation.txt CHANGED
@@ -1 +1 @@
1
- {"eval_loss": 3.3664300441741943, "eval_runtime": 1.6554, "eval_samples_per_second": 42.89, "eval_steps_per_second": 5.437, "epoch": 1.0}
 
1
+ {"eval_loss": 2.9845471382141113, "eval_runtime": 3.5891, "eval_samples_per_second": 21.454, "eval_steps_per_second": 2.786, "epoch": 2.0}
flax_model.msgpack CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:68dd29573f781095d9ad848fe4c8b6c2a22a1a287ec206a96c4ed108a61559c1
3
  size 497764120
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aab7a5aa95958bd4c8c810e9b7acd8ff750da2c5eafe1cbbf3b6f40519373f40
3
  size 497764120
optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:49f94360ec805ce12fe6f0dfa4326451d8c48fda61a78c70af1e43e4ffd058d5
3
  size 995603825
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89e6aded72e69f7bb9454c89045641fe99631a9eadc3ac776867f59a2b6ab290
3
  size 995603825
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:74955c53f4c610171358cb48c570ab0c10cc2b3ece76f517c6f6411aaa38644e
3
  size 510403817
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:69e9a718f89ae122d4823c99c69935afc63bdcdcdac02306b43ce41185505c77
3
  size 510403817
rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0def2032f81512e3f8bff61f3e21073854d8d398d1be01592c54d7bfc7c874fd
3
- size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:285cd8fb1eecf2a6ec93b901adfe605f19a10d2db64bcd2676529b2f8a13a1bf
3
+ size 14439
scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7e450cb9c3dd5d5e299310845f6d7ab8731c0d1d1d427cd56769b403ce862ce4
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:858b0150f63e516bfdd54df0bdcc3e1de87c6a580f8d9790a43f52a335f62cca
3
  size 623
tokenizer_config.json CHANGED
@@ -1 +1 @@
1
- {"unk_token": "<|endoftext|>", "bos_token": "<|endoftext|>", "eos_token": "<|endoftext|>", "add_prefix_space": false, "model_max_length": 1024, "special_tokens_map_file": null, "name_or_path": "gpt2", "tokenizer_class": "GPT2Tokenizer"}
 
1
+ {"unk_token": "<|endoftext|>", "bos_token": "<|endoftext|>", "eos_token": "<|endoftext|>", "add_prefix_space": false, "model_max_length": 1024, "special_tokens_map_file": null, "name_or_path": "huggingartists/cardi-b", "tokenizer_class": "GPT2Tokenizer"}
trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "best_metric": 3.3664300441741943,
3
- "best_model_checkpoint": "output/cardi-b/checkpoint-58",
4
- "epoch": 1.0,
5
- "global_step": 58,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -80,11 +80,85 @@
80
  "eval_samples_per_second": 44.424,
81
  "eval_steps_per_second": 5.631,
82
  "step": 58
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
83
  }
84
  ],
85
- "max_steps": 58,
86
- "num_train_epochs": 1,
87
- "total_flos": 59705229312000.0,
88
  "trial_name": null,
89
  "trial_params": null
90
  }
 
1
  {
2
+ "best_metric": 2.9845471382141113,
3
+ "best_model_checkpoint": "output/cardi-b/checkpoint-114",
4
+ "epoch": 2.0,
5
+ "global_step": 114,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
80
  "eval_samples_per_second": 44.424,
81
  "eval_steps_per_second": 5.631,
82
  "step": 58
83
+ },
84
+ {
85
+ "epoch": 1.05,
86
+ "learning_rate": 9.35614586573241e-07,
87
+ "loss": 3.234,
88
+ "step": 60
89
+ },
90
+ {
91
+ "epoch": 1.14,
92
+ "learning_rate": 6.5610987761461805e-06,
93
+ "loss": 3.3216,
94
+ "step": 65
95
+ },
96
+ {
97
+ "epoch": 1.23,
98
+ "learning_rate": 1.6868286569304916e-05,
99
+ "loss": 3.2467,
100
+ "step": 70
101
+ },
102
+ {
103
+ "epoch": 1.32,
104
+ "learning_rate": 3.1079356352801514e-05,
105
+ "loss": 3.3662,
106
+ "step": 75
107
+ },
108
+ {
109
+ "epoch": 1.4,
110
+ "learning_rate": 4.8121883965283725e-05,
111
+ "loss": 3.3484,
112
+ "step": 80
113
+ },
114
+ {
115
+ "epoch": 1.49,
116
+ "learning_rate": 6.670977211354408e-05,
117
+ "loss": 3.2623,
118
+ "step": 85
119
+ },
120
+ {
121
+ "epoch": 1.58,
122
+ "learning_rate": 8.54403044178588e-05,
123
+ "loss": 3.0856,
124
+ "step": 90
125
+ },
126
+ {
127
+ "epoch": 1.67,
128
+ "learning_rate": 0.00010290000000000001,
129
+ "loss": 3.2992,
130
+ "step": 95
131
+ },
132
+ {
133
+ "epoch": 1.75,
134
+ "learning_rate": 0.00011777128040335575,
135
+ "loss": 3.1025,
136
+ "step": 100
137
+ },
138
+ {
139
+ "epoch": 1.84,
140
+ "learning_rate": 0.00012893189933276512,
141
+ "loss": 3.2896,
142
+ "step": 105
143
+ },
144
+ {
145
+ "epoch": 1.93,
146
+ "learning_rate": 0.00013553963184824208,
147
+ "loss": 3.228,
148
+ "step": 110
149
+ },
150
+ {
151
+ "epoch": 2.0,
152
+ "eval_loss": 2.9845471382141113,
153
+ "eval_runtime": 3.4603,
154
+ "eval_samples_per_second": 22.252,
155
+ "eval_steps_per_second": 2.89,
156
+ "step": 114
157
  }
158
  ],
159
+ "max_steps": 114,
160
+ "num_train_epochs": 2,
161
+ "total_flos": 117581414400000.0,
162
  "trial_name": null,
163
  "trial_params": null
164
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a62540a61b468205c2469fc48112f0523a3e5bd744b567b166b214b48f501b94
3
  size 2671
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a2f61ff06cbbabd7f1d12a195eee711fc2c26b1693ce37e36414e8203238c3e3
3
  size 2671