MohamedAAK
/

my_awesome_power_model_llm

Text Generation

generated_from_keras_callback

Inference Endpoints

Model card | Files and versions | Community

MohamedAAK committed on Jan 27, 2024

Commit

8013823

·

1 Parent(s): db2d3e2

Training in progress epoch 0

Files changed (3) hide show

README.md +3 -22
special_tokens_map.json +21 -3
tf_model.h5 +1 -1

README.md CHANGED Viewed

@@ -15,8 +15,8 @@ probably proofread and complete it, then remove this comment. -->
 This model is a fine-tuned version of [distilgpt2](https://huggingface.co/distilgpt2) on an unknown dataset.
 It achieves the following results on the evaluation set:
-- Train Loss: 2.1290
-- Epoch: 19
 ## Model description
@@ -42,26 +42,7 @@ The following hyperparameters were used during training:
 | Train Loss | Epoch |
 |:----------:|:-----:|
-| 7.2988     | 0     |
-| 3.1128     | 1     |
-| 2.9082     | 2     |
-| 2.8046     | 3     |
-| 2.7177     | 4     |
-| 2.6450     | 5     |
-| 2.5715     | 6     |
-| 2.5103     | 7     |
-| 2.4482     | 8     |
-| 2.3980     | 9     |
-| 2.3571     | 10    |
-| 2.3208     | 11    |
-| 2.2912     | 12    |
-| 2.2572     | 13    |
-| 2.2338     | 14    |
-| 2.2119     | 15    |
-| 2.1838     | 16    |
-| 2.1635     | 17    |
-| 2.1428     | 18    |
-| 2.1290     | 19    |
 ### Framework versions

 This model is a fine-tuned version of [distilgpt2](https://huggingface.co/distilgpt2) on an unknown dataset.
 It achieves the following results on the evaluation set:
+- Train Loss: 6.2910
+- Epoch: 0
 ## Model description
 | Train Loss | Epoch |
 |:----------:|:-----:|
+| 6.2910     | 0     |
 ### Framework versions

special_tokens_map.json CHANGED Viewed

@@ -1,6 +1,18 @@
 {
-  "bos_token": "<|endoftext|>",
-  "eos_token": "<|endoftext|>",
   "pad_token": {
     "content": "[PAD]",
     "lstrip": false,
@@ -8,5 +20,11 @@
     "rstrip": false,
     "single_word": false
   },
-  "unk_token": "<|endoftext|>"
 }

 {
+  "bos_token": {
+    "content": "<|endoftext|>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "eos_token": {
+    "content": "<|endoftext|>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
   "pad_token": {
     "content": "[PAD]",
     "lstrip": false,
     "rstrip": false,
     "single_word": false
   },
+  "unk_token": {
+    "content": "<|endoftext|>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  }
 }

tf_model.h5 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d443ceb3aad3a3955978ed9571f4dd93de1d929d181f796448fea55c289a1c3e
 size 327748552

 version https://git-lfs.github.com/spec/v1
+oid sha256:8786b81a6615a44a3cc68f96624f0b268f974263fc8474877ab2fcff4cf4f8ea
 size 327748552