itti11 commited on Oct 27, 2024

Commit

2692d02

verified ·

1 Parent(s): ec8df03

Model save

Browse files

Files changed (26) hide show

README.md +12 -8
adapter_config.json +4 -4
adapter_model.safetensors +3 -0
runs/Oct27_15-30-26_graz/events.out.tfevents.1730010650.graz.1060953.0 +3 -0
runs/Oct27_15-35-07_graz/events.out.tfevents.1730010913.graz.1061216.0 +3 -0
runs/Oct27_15-36-40_graz/events.out.tfevents.1730011006.graz.1061496.0 +3 -0
runs/Oct27_15-38-22_graz/events.out.tfevents.1730011108.graz.1061695.0 +3 -0
runs/Oct27_15-46-54_graz/events.out.tfevents.1730011620.graz.1062153.0 +3 -0
runs/Oct27_15-48-15_graz/events.out.tfevents.1730011701.graz.1062488.0 +3 -0
runs/Oct27_15-49-17_graz/events.out.tfevents.1730011762.graz.1062687.0 +3 -0
runs/Oct27_16-32-58_graz/events.out.tfevents.1730014383.graz.1063356.0 +3 -0
runs/Oct27_16-34-17_graz/events.out.tfevents.1730014462.graz.1063557.0 +3 -0
runs/Oct27_16-35-02_graz/events.out.tfevents.1730014508.graz.1063769.0 +3 -0
runs/Oct27_16-48-37_graz/events.out.tfevents.1730015328.graz.1065240.0 +3 -0
runs/Oct27_16-50-13_graz/events.out.tfevents.1730015424.graz.1065447.0 +3 -0
runs/Oct27_16-51-10_graz/events.out.tfevents.1730015481.graz.1065650.0 +3 -0
runs/Oct27_16-59-08_graz/events.out.tfevents.1730015959.graz.1066060.0 +3 -0
runs/Oct27_17-09-13_graz/events.out.tfevents.1730016564.graz.1066690.0 +3 -0
runs/Oct27_17-10-33_graz/events.out.tfevents.1730016644.graz.1066893.0 +3 -0
runs/Oct27_17-11-48_graz/events.out.tfevents.1730016719.graz.1067096.0 +3 -0
runs/Oct27_17-12-50_graz/events.out.tfevents.1730016781.graz.1067299.0 +3 -0
runs/Oct27_18-01-15_graz/events.out.tfevents.1730019686.graz.1067916.0 +3 -0
runs/Oct27_18-04-27_graz/events.out.tfevents.1730019879.graz.1068110.0 +3 -0
runs/Oct27_18-08-33_graz/events.out.tfevents.1730020125.graz.1068561.0 +3 -0
runs/Oct27_18-09-10_graz/events.out.tfevents.1730020162.graz.1068744.0 +3 -0
training_args.bin +2 -2

README.md CHANGED Viewed

@@ -1,6 +1,7 @@
 ---
-license: cc-by-sa-4.0
-base_model: cyberagent/open-calm-3b
 tags:
 - generated_from_trainer
 model-index:
@@ -13,7 +14,7 @@ should probably proofread and complete it, then remove this comment. -->
 # lora
-This model is a fine-tuned version of [cyberagent/open-calm-3b](https://huggingface.co/cyberagent/open-calm-3b) on an unknown dataset.
 ## Model description
@@ -33,15 +34,17 @@ More information needed
 The following hyperparameters were used during training:
 - learning_rate: 2e-05
-- train_batch_size: 1
 - eval_batch_size: 8
 - seed: 42
 - gradient_accumulation_steps: 4
-- total_train_batch_size: 4
-- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: linear
 - lr_scheduler_warmup_steps: 2
 - num_epochs: 2
 ### Training results
@@ -49,7 +52,8 @@ The following hyperparameters were used during training:
 ### Framework versions
-- Transformers 4.35.0.dev0
 - Pytorch 1.12.1+cu113
 - Datasets 2.6.1
-- Tokenizers 0.14.1

 ---
+base_model: rinna/japanese-gpt-neox-3.6b
+library_name: peft
+license: mit
 tags:
 - generated_from_trainer
 model-index:
 # lora
+This model is a fine-tuned version of [rinna/japanese-gpt-neox-3.6b](https://huggingface.co/rinna/japanese-gpt-neox-3.6b) on an unknown dataset.
 ## Model description
 The following hyperparameters were used during training:
 - learning_rate: 2e-05
+- train_batch_size: 4
 - eval_batch_size: 8
 - seed: 42
+- distributed_type: multi-GPU
 - gradient_accumulation_steps: 4
+- total_train_batch_size: 16
+- optimizer: Use adamw_hf with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
 - lr_scheduler_type: linear
 - lr_scheduler_warmup_steps: 2
 - num_epochs: 2
+- mixed_precision_training: Native AMP
 ### Training results
 ### Framework versions
+- PEFT 0.13.2
+- Transformers 4.46.0
 - Pytorch 1.12.1+cu113
 - Datasets 2.6.1
+- Tokenizers 0.20.1

adapter_config.json CHANGED Viewed

@@ -4,7 +4,7 @@
     "base_model_class": "GPTNeoXForCausalLM",
     "parent_library": "transformers.models.gpt_neox.modeling_gpt_neox"
   },
-  "base_model_name_or_path": "cyberagent/open-calm-3b",
   "bias": "none",
   "fan_in_fan_out": false,
   "inference_mode": true,
@@ -23,10 +23,10 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "attention.query_key_value",
-    "mlp.dense_4h_to_h",
     "mlp.dense_h_to_4h",
-    "attention.dense"
   ],
   "task_type": null,
   "use_dora": true,

     "base_model_class": "GPTNeoXForCausalLM",
     "parent_library": "transformers.models.gpt_neox.modeling_gpt_neox"
   },
+  "base_model_name_or_path": "rinna/japanese-gpt-neox-3.6b",
   "bias": "none",
   "fan_in_fan_out": false,
   "inference_mode": true,
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
     "mlp.dense_h_to_4h",
+    "attention.dense",
+    "mlp.dense_4h_to_h",
+    "attention.query_key_value"
   ],
   "task_type": null,
   "use_dora": true,

adapter_model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1f9e660babf44b0418a0c73df182d426f49242f735d41c64ccf480f8d9c97ab1
+size 27837832

runs/Oct27_15-30-26_graz/events.out.tfevents.1730010650.graz.1060953.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0ab917db4096f468f38492de34629e9524e93dbeef526df192adaf7de7597687
+size 5123

runs/Oct27_15-35-07_graz/events.out.tfevents.1730010913.graz.1061216.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f74c48c3d3449a8a0e9bc7aac2be37663fde182435a3436cbd8a91de407661d9
+size 5123

runs/Oct27_15-36-40_graz/events.out.tfevents.1730011006.graz.1061496.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e21a28dda2e26c27cfeff8679d4abc6ed4a3e822b7f350b8640a2d8d01bf9781
+size 5123

runs/Oct27_15-38-22_graz/events.out.tfevents.1730011108.graz.1061695.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f7e790821063852310f4bdb886005345eb6b74ddfe2d95661182e7d5335ce1ce
+size 5123

runs/Oct27_15-46-54_graz/events.out.tfevents.1730011620.graz.1062153.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2974f266c482e3b4c22032ba219e5e80d66eaae4203ce2ce5087e6e96148f2c5
+size 5123

runs/Oct27_15-48-15_graz/events.out.tfevents.1730011701.graz.1062488.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:bffc68e134127bc0fe415fdb951d288bd920712013f5307b652cc3afbfad2b20
+size 5123

runs/Oct27_15-49-17_graz/events.out.tfevents.1730011762.graz.1062687.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:04d5f93669cf853208cdf2fb4efe593c4ac8fb365768d1ca9507487990bc2cce
+size 5123

runs/Oct27_16-32-58_graz/events.out.tfevents.1730014383.graz.1063356.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:23bb18ba91ac24d8570498f138907d3b2f561e6ce8c7f48530e9b20b09020c10
+size 5080

runs/Oct27_16-34-17_graz/events.out.tfevents.1730014462.graz.1063557.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:22ff104c76a0726efed1b4ddee7c7bd1fb4d18bb5ac37e753f762f2da7db756d
+size 5080

runs/Oct27_16-35-02_graz/events.out.tfevents.1730014508.graz.1063769.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8ad904360d119d905a57f67ddade39290d3dcef22ccdf5423b15ed4cd6fb4985
+size 5080

runs/Oct27_16-48-37_graz/events.out.tfevents.1730015328.graz.1065240.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:641caa0850f642adad3c23f33f4871fddb23a7c4a68a7b864789a9c1aff32cd0
+size 5079

runs/Oct27_16-50-13_graz/events.out.tfevents.1730015424.graz.1065447.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:77742a267a3812a98c6f99a4eec70c0b74824c913ce8987b8f25e93215dd22d8
+size 5079

runs/Oct27_16-51-10_graz/events.out.tfevents.1730015481.graz.1065650.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:05fcf06e37043efc30b38e00accd0a374adc4ec638797e56a8af439bb9279972
+size 5079

runs/Oct27_16-59-08_graz/events.out.tfevents.1730015959.graz.1066060.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:77301ab089dac40125ba46efb4d7e82d6df21cb8d0c7bb916d2f2f67d1fe6c5d
+size 5079

runs/Oct27_17-09-13_graz/events.out.tfevents.1730016564.graz.1066690.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2f82ea3859dc67b54b6f3794198f38244f6d31c149c959e6d966e3062ab8d4a9
+size 5079

runs/Oct27_17-10-33_graz/events.out.tfevents.1730016644.graz.1066893.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7d929530723af00d9df938801eeeb2a97725279de8fd4ef2b62bee183fa903f3
+size 5079

runs/Oct27_17-11-48_graz/events.out.tfevents.1730016719.graz.1067096.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d15f3de998f21183368a7390b72fc13bf65b65ef2d5007a2c4a9d2b3434b70fc
+size 5078

runs/Oct27_17-12-50_graz/events.out.tfevents.1730016781.graz.1067299.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:aedc245bb3680102c92994b9e64b9d90924d42df0f9d119e8c049e369b6348c0
+size 5079

runs/Oct27_18-01-15_graz/events.out.tfevents.1730019686.graz.1067916.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7c72e676e96922a4f4bb70d333752a43ae06ad43b33344e6fee976b5c0aee174
+size 5127

runs/Oct27_18-04-27_graz/events.out.tfevents.1730019879.graz.1068110.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:45ff6ec2df57929341f68fc3e0998965fe3242f02aa47107ec5c3616173acc1d
+size 5127

runs/Oct27_18-08-33_graz/events.out.tfevents.1730020125.graz.1068561.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:429e404c43c154aa1ed6941454dc3a92491c227aca02c31aa3e0c146fd2d5ecd
+size 5127

runs/Oct27_18-09-10_graz/events.out.tfevents.1730020162.graz.1068744.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3cb874cf82f98bb9b4fc8299abf626de4b9995da6d7b326cce850566761a0d77
+size 5692

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c6aa331d73617c134b921dd72a3aa0f2069c9a5f1bf39a72c4e72348813b1ae7
-size 4015

 version https://git-lfs.github.com/spec/v1
+oid sha256:16a1898da87ecf03bba600ea114f4642e30b06e4011d1add4b3f2d37c1e366e5
+size 7151