hoganpham committed on
Commit
9a8b92f
·
verified ·
1 Parent(s): 34ef531

Training in progress, step 500

Browse files
config.json CHANGED
@@ -1,5 +1,6 @@
1
  {
2
- "_name_or_path": "gpt2",
 
3
  "activation_function": "gelu_new",
4
  "architectures": [
5
  "GPT2LMHeadModel"
@@ -8,14 +9,20 @@
8
  "bos_token_id": 50256,
9
  "embd_pdrop": 0.1,
10
  "eos_token_id": 50256,
 
 
 
11
  "initializer_range": 0.02,
 
 
 
12
  "layer_norm_epsilon": 1e-05,
13
  "model_type": "gpt2",
14
  "n_ctx": 1024,
15
  "n_embd": 768,
16
  "n_head": 12,
17
  "n_inner": null,
18
- "n_layer": 12,
19
  "n_positions": 1024,
20
  "reorder_and_upcast_attn": false,
21
  "resid_pdrop": 0.1,
 
1
  {
2
+ "_name_or_path": "distilgpt2",
3
+ "_num_labels": 1,
4
  "activation_function": "gelu_new",
5
  "architectures": [
6
  "GPT2LMHeadModel"
 
9
  "bos_token_id": 50256,
10
  "embd_pdrop": 0.1,
11
  "eos_token_id": 50256,
12
+ "id2label": {
13
+ "0": "LABEL_0"
14
+ },
15
  "initializer_range": 0.02,
16
+ "label2id": {
17
+ "LABEL_0": 0
18
+ },
19
  "layer_norm_epsilon": 1e-05,
20
  "model_type": "gpt2",
21
  "n_ctx": 1024,
22
  "n_embd": 768,
23
  "n_head": 12,
24
  "n_inner": null,
25
+ "n_layer": 6,
26
  "n_positions": 1024,
27
  "reorder_and_upcast_attn": false,
28
  "resid_pdrop": 0.1,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5609ac6f01101d2bcb425aa64610463292a0fe69c5001c2522d8c213dfd822b8
3
- size 497774208
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:04832d090896cb5272c3d91e178a83d4a301826fb74b6f10cbcd85270e4e7f45
3
+ size 327657928
runs/Dec26_14-30-20_4f87fa13cf4f/events.out.tfevents.1735223422.4f87fa13cf4f.48986.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7d808b3160144279fcf5c5662f60584f2ae9498334eb011d259bca1a6b6f6a78
3
+ size 5329
runs/Dec26_15-17-35_4f87fa13cf4f/events.out.tfevents.1735226257.4f87fa13cf4f.52160.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b681d61fe327edf63094efd3caaed004a06267047b8f8aadfed62cf39b500f6a
3
+ size 5329
runs/Dec26_15-18-47_4f87fa13cf4f/events.out.tfevents.1735226328.4f87fa13cf4f.52529.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f1f0fcde8d6c9a22ea5ef5b24cce47f57eec38e5d4df36e54a8074664bf1e7b8
3
+ size 6025
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9f301c938db1cb6977900c5e27614e30ccd7fd4df22c121c98fedc0e91b2cf20
3
  size 5240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44da7eabc06c79a1f80607609567e44ae9ae320d05d9c4883a152a08f36e8f4f
3
  size 5240