Model save

Browse files

Files changed (6)

README.md +13 -23
adapter_config.json +3 -2
adapter_model.safetensors +1 -1
runs/Mar17_15-20-21_485a833b00a5/events.out.tfevents.1710688822.485a833b00a5.160.0 +3 -0
runs/Mar17_15-20-21_485a833b00a5/events.out.tfevents.1710692008.485a833b00a5.160.1 +3 -0
training_args.bin +1 -1

README.md CHANGED

@@ -14,7 +14,7 @@ should probably proofread and complete it, then remove this comment. -->
 This model is a fine-tuned version of [meta-llama/Llama-2-7b-chat-hf](https://huggingface.co/meta-llama/Llama-2-7b-chat-hf) on an unknown dataset.
 It achieves the following results on the evaluation set:
-- Loss: 2.1092
 ## Model description
@@ -39,37 +39,27 @@ The following hyperparameters were used during training:
 - seed: 42
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: linear
-- training_steps: 200
 ### Training results
 | Training Loss | Epoch | Step | Validation Loss |
 |:-------------:|:-----:|:----:|:---------------:|
-| 2.7967        | 0.22  | 10   | 2.7779          |
-| 2.5905        | 0.44  | 20   | 2.5530          |
-| 2.3863        | 0.67  | 30   | 2.4699          |
-| 2.3334        | 0.89  | 40   | 2.3923          |
-| 2.313         | 1.11  | 50   | 2.3418          |
-| 2.0965        | 1.33  | 60   | 2.2902          |
-| 2.2402        | 1.56  | 70   | 2.2599          |
-| 2.213         | 1.78  | 80   | 2.2329          |
-| 2.1118        | 2.0   | 90   | 2.2142          |
-| 2.071         | 2.22  | 100  | 2.1969          |
-| 2.0024        | 2.44  | 110  | 2.1846          |
-| 2.0814        | 2.67  | 120  | 2.1692          |
-| 2.0853        | 2.89  | 130  | 2.1540          |
-| 1.9573        | 3.11  | 140  | 2.1419          |
-| 1.9231        | 3.33  | 150  | 2.1358          |
-| 1.921         | 3.56  | 160  | 2.1240          |
-| 1.9618        | 3.78  | 170  | 2.1166          |
-| 2.0817        | 4.0   | 180  | 2.1120          |
-| 2.0458        | 4.22  | 190  | 2.1102          |
-| 1.9076        | 4.44  | 200  | 2.1092          |
 ### Framework versions
 - Transformers 4.39.0.dev0
-- Pytorch 2.1.0+cu121
 - Datasets 2.18.0
 - Tokenizers 0.15.2

 This model is a fine-tuned version of [meta-llama/Llama-2-7b-chat-hf](https://huggingface.co/meta-llama/Llama-2-7b-chat-hf) on an unknown dataset.
 It achieves the following results on the evaluation set:
+- Loss: 2.4423
 ## Model description
 - seed: 42
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: linear
+- training_steps: 100
 ### Training results
 | Training Loss | Epoch | Step | Validation Loss |
 |:-------------:|:-----:|:----:|:---------------:|
+| 3.3431        | 0.03  | 10   | 3.1212          |
+| 2.8976        | 0.05  | 20   | 2.7770          |
+| 2.6878        | 0.08  | 30   | 2.6526          |
+| 2.6344        | 0.1   | 40   | 2.5690          |
+| 2.5165        | 0.13  | 50   | 2.5212          |
+| 2.5377        | 0.15  | 60   | 2.4917          |
+| 2.4577        | 0.18  | 70   | 2.4712          |
+| 2.4309        | 0.21  | 80   | 2.4562          |
+| 2.3986        | 0.23  | 90   | 2.4465          |
+| 2.4445        | 0.26  | 100  | 2.4423          |
 ### Framework versions
 - Transformers 4.39.0.dev0
+- Pytorch 2.2.1+cu121
 - Datasets 2.18.0
 - Tokenizers 0.15.2

adapter_config.json CHANGED

@@ -6,6 +6,7 @@
   "fan_in_fan_out": false,
   "inference_mode": false,
   "init_lora_weights": true,
   "layers_pattern": null,
   "layers_to_transform": null,
   "loftq_config": {},
@@ -19,8 +20,8 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "q_proj",
-    "v_proj"
   ],
   "task_type": "CAUSAL_LM",
   "use_dora": false,

   "fan_in_fan_out": false,
   "inference_mode": false,
   "init_lora_weights": true,
+  "layer_replication": null,
   "layers_pattern": null,
   "layers_to_transform": null,
   "loftq_config": {},
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
+    "v_proj",
+    "q_proj"
   ],
   "task_type": "CAUSAL_LM",
   "use_dora": false,

adapter_model.safetensors CHANGED

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9cfd9d88b14058fbf3ad8ce7f236add4e59c361dba6448a89d28a1cd7aaa299d
 size 16794200

 version https://git-lfs.github.com/spec/v1
+oid sha256:ed7d6de8b7c52bacd210c20b16faf33905e39b10e5ca18f9a2cbd91b0493a979
 size 16794200

runs/Mar17_15-20-21_485a833b00a5/events.out.tfevents.1710688822.485a833b00a5.160.0 ADDED

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d19dbb32d4a95c0220438c50528a10848fa59e65ebba69ee233d9ee1fbf74446
+size 10154

runs/Mar17_15-20-21_485a833b00a5/events.out.tfevents.1710692008.485a833b00a5.160.1 ADDED

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b040b90e368ebe0af6f66de3061df2c474fb78dd09c7844aac4da6867e24993e
+size 354

training_args.bin CHANGED

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e4a6eff38eb5e666f4a74d12cf9f1f08bca89d3040a9ba99e04778a0b5f7043c
 size 4856

 version https://git-lfs.github.com/spec/v1
+oid sha256:3cddfc46772e5e0a83d0d3f74a3c7cc05afdb6eafd14efd3a5696416970e40ab
 size 4856