Tippawan
/

proof-reading-SeaLLM3-7B-Chat-3090-v7

@@ -6,7 +6,7 @@ tags:
 - axolotl
 - generated_from_trainer
 model-index:
-- name: proof-reading-SeaLLM3-7B-Chat-3090-v6
   results: []
 ---
@@ -26,7 +26,7 @@ load_in_4bit: true
 strict: false
 datasets:
-  - path: Tippawan/pr-6-seallm-messages-only
     type: sharegpt
     conversation: chatml
     field_messages: messages
@@ -41,7 +41,7 @@ eval_sample_packing: false
 pad_to_sequence_len: false
 push_to_hub: true
-hub_model_id: Tippawan/proof-reading-SeaLLM3-7B-Chat-3090-v6  # Replace with your Hugging Face repo ID
 use_auth_token: true  # Ensure you have set your Hugging Face API token in the environment
 hub_private_repo: true  # Set to true if you want the repository to be private
 hub_strategy: all_checkpoints
@@ -49,14 +49,14 @@ save_total_limit: 3
 load_best_model_at_end: true
 adapter: lora
-lora_model_dir: Tippawan/proof-reading-SeaLLM3-7B-Chat-3090-v5
 lora_r: 16
 lora_alpha: 32
 lora_dropout: 0.05
 lora_target_linear: true
 lora_fan_in_fan_out:
-wandb_project: proof-reading-SeaLLM3-7B-Chat-3090-v6
 wandb_entity:
 wandb_watch:
 wandb_name:
@@ -64,7 +64,7 @@ wandb_log_model:
 gradient_accumulation_steps: 4
 micro_batch_size: 8
-num_epochs: 10  # edited 3
 optimizer: adamw_torch
 lr_scheduler: cosine
 learning_rate: 0.0002
@@ -96,7 +96,7 @@ special_tokens:
 </details><br>
-# proof-reading-SeaLLM3-7B-Chat-3090-v6
 This model is a fine-tuned version of [SeaLLMs/SeaLLM3-7B-Chat](https://huggingface.co/SeaLLMs/SeaLLM3-7B-Chat) on the Tippawan/pr-6-seallm-messages-only dataset.
@@ -126,7 +126,7 @@ The following hyperparameters were used during training:
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: cosine
 - lr_scheduler_warmup_steps: 10
-- num_epochs: 10
 ### Training results

 - axolotl
 - generated_from_trainer
 model-index:
+- name: proof-reading-SeaLLM3-7B-Chat-3090-v7
   results: []
 ---
 strict: false
 datasets:
+  - path: Tippawan/pr-7-seallm
     type: sharegpt
     conversation: chatml
     field_messages: messages
 pad_to_sequence_len: false
 push_to_hub: true
+hub_model_id: Tippawan/proof-reading-SeaLLM3-7B-Chat-3090-v7  # Replace with your Hugging Face repo ID
 use_auth_token: true  # Ensure you have set your Hugging Face API token in the environment
 hub_private_repo: true  # Set to true if you want the repository to be private
 hub_strategy: all_checkpoints
 load_best_model_at_end: true
 adapter: lora
+lora_model_dir: Tippawan/proof-reading-SeaLLM3-7B-Chat-3090-v6
 lora_r: 16
 lora_alpha: 32
 lora_dropout: 0.05
 lora_target_linear: true
 lora_fan_in_fan_out:
+wandb_project: proof-reading-SeaLLM3-7B-Chat-3090-v7
 wandb_entity:
 wandb_watch:
 wandb_name:
 gradient_accumulation_steps: 4
 micro_batch_size: 8
+num_epochs: 1  # edited 3
 optimizer: adamw_torch
 lr_scheduler: cosine
 learning_rate: 0.0002
 </details><br>
+# proof-reading-SeaLLM3-7B-Chat-3090-v7
 This model is a fine-tuned version of [SeaLLMs/SeaLLM3-7B-Chat](https://huggingface.co/SeaLLMs/SeaLLM3-7B-Chat) on the Tippawan/pr-7-seallm dataset.
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: cosine
 - lr_scheduler_warmup_steps: 10
+- num_epochs: 1
 ### Training results

adapter_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b34f0b8b3c4464ace9eb97017538ef0a0d11f2df2637924714bd32bd7b5994bc
 size 161621802

 version https://git-lfs.github.com/spec/v1
+oid sha256:148fcbc3147964e77cd19ea6bcf16d29a91db5a9938b555fcc453b35032ca6d5
 size 161621802