staturecrane
/

news_kg_model

Text Generation

generated_from_keras_callback

Inference Endpoints

Model card | Files and versions | Community

staturecrane committed on Apr 2, 2023

Commit

5a6e037

·

1 Parent(s): c76ffb5

Training in progress epoch 0

Files changed (3) hide show

README.md +2 -2
tf_model.h5 +1 -1
tokenizer.json +2 -14

README.md CHANGED Viewed

@@ -14,7 +14,7 @@ probably proofread and complete it, then remove this comment. -->
 This model is a fine-tuned version of [distilgpt2](https://huggingface.co/distilgpt2) on an unknown dataset.
 It achieves the following results on the evaluation set:
-- Train Loss: 3.0111
 - Epoch: 0
 ## Model description
@@ -41,7 +41,7 @@ The following hyperparameters were used during training:
 | Train Loss | Epoch |
 |:----------:|:-----:|
-| 3.0111     | 0     |
 ### Framework versions

 This model is a fine-tuned version of [distilgpt2](https://huggingface.co/distilgpt2) on an unknown dataset.
 It achieves the following results on the evaluation set:
+- Train Loss: 3.0157
 - Epoch: 0
 ## Model description
 | Train Loss | Epoch |
 |:----------:|:-----:|
+| 3.0157     | 0     |
 ### Framework versions

tf_model.h5 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:466389859c65b171a10544ba76fd001a161de4b72d0e5e238e4bdc281b74ef39
 size 327745472

 version https://git-lfs.github.com/spec/v1
+oid sha256:ea295e5c8c83aa0237ed599a34a291953e533dc57c7f45b72dc8b68054b3eb48
 size 327745472

tokenizer.json CHANGED Viewed

@@ -1,19 +1,7 @@
 {
   "version": "1.0",
-  "truncation": {
-    "direction": "Right",
-    "max_length": 2048,
-    "strategy": "LongestFirst",
-    "stride": 0
-  },
-  "padding": {
-    "strategy": "BatchLongest",
-    "direction": "Right",
-    "pad_to_multiple_of": null,
-    "pad_id": 50256,
-    "pad_type_id": 0,
-    "pad_token": "<|endoftext|>"
-  },
   "added_tokens": [
     {
       "id": 50256,

 {
   "version": "1.0",
+  "truncation": null,
+  "padding": null,
   "added_tokens": [
     {
       "id": 50256,