staturecrane committed on
Commit
5a6e037
·
1 Parent(s): c76ffb5

Training in progress epoch 0

Browse files
Files changed (3) hide show
  1. README.md +2 -2
  2. tf_model.h5 +1 -1
  3. tokenizer.json +2 -14
README.md CHANGED
@@ -14,7 +14,7 @@ probably proofread and complete it, then remove this comment. -->
14
 
15
  This model is a fine-tuned version of [distilgpt2](https://huggingface.co/distilgpt2) on an unknown dataset.
16
  It achieves the following results on the evaluation set:
17
- - Train Loss: 3.0111
18
  - Epoch: 0
19
 
20
  ## Model description
@@ -41,7 +41,7 @@ The following hyperparameters were used during training:
41
 
42
  | Train Loss | Epoch |
43
  |:----------:|:-----:|
44
- | 3.0111 | 0 |
45
 
46
 
47
  ### Framework versions
 
14
 
15
  This model is a fine-tuned version of [distilgpt2](https://huggingface.co/distilgpt2) on an unknown dataset.
16
  It achieves the following results on the evaluation set:
17
+ - Train Loss: 3.0157
18
  - Epoch: 0
19
 
20
  ## Model description
 
41
 
42
  | Train Loss | Epoch |
43
  |:----------:|:-----:|
44
+ | 3.0157 | 0 |
45
 
46
 
47
  ### Framework versions
tf_model.h5 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:466389859c65b171a10544ba76fd001a161de4b72d0e5e238e4bdc281b74ef39
3
  size 327745472
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ea295e5c8c83aa0237ed599a34a291953e533dc57c7f45b72dc8b68054b3eb48
3
  size 327745472
tokenizer.json CHANGED
@@ -1,19 +1,7 @@
1
  {
2
  "version": "1.0",
3
- "truncation": {
4
- "direction": "Right",
5
- "max_length": 2048,
6
- "strategy": "LongestFirst",
7
- "stride": 0
8
- },
9
- "padding": {
10
- "strategy": "BatchLongest",
11
- "direction": "Right",
12
- "pad_to_multiple_of": null,
13
- "pad_id": 50256,
14
- "pad_type_id": 0,
15
- "pad_token": "<|endoftext|>"
16
- },
17
  "added_tokens": [
18
  {
19
  "id": 50256,
 
1
  {
2
  "version": "1.0",
3
+ "truncation": null,
4
+ "padding": null,
 
 
 
 
 
 
 
 
 
 
 
 
5
  "added_tokens": [
6
  {
7
  "id": 50256,