winglian committed on
Commit
dd5fe97
·
1 Parent(s): 47b1370

Upload folder using huggingface_hub

Browse files
Files changed (1) hide show
  1. configs/3b-pt.yml +68 -0
configs/3b-pt.yml ADDED
@@ -0,0 +1,68 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ base_model: winglian/Llama-2-3b-hf
2
+ base_model_config: winglian/Llama-2-3b-hf
3
+ model_type: LlamaForCausalLM
4
+ tokenizer_type: LlamaTokenizer
5
+ load_in_8bit: false
6
+ load_in_4bit: false
7
+ hub_model_id: winglian/llama-2-3b-cpt
8
+ strict: false
9
+ # pretraining_dataset: togethercomputer/RedPajama-Data-1T-Sample
10
+ push_dataset_to_hub:
11
+ datasets:
12
+ - path: togethercomputer/RedPajama-Data-1T-Sample
13
+ type: completion
14
+ dataset_prepared_path: last_run_prepared
15
+ val_set_size: 0.0
16
+ adapter:
17
+ lora_model_dir:
18
+ sequence_len: 4096
19
+ sample_packing:
20
+ lora_r:
21
+ lora_alpha:
22
+ lora_dropout:
23
+ lora_target_modules:
24
+ lora_target_linear:
25
+ lora_fan_in_fan_out:
26
+ wandb_project: llama-2-3b-cpt
27
+ wandb_entity:
28
+ wandb_watch:
29
+ wandb_run_id:
30
+ wandb_log_model:
31
+ output_dir: ./llama-2-3b-out
32
+ # max_steps: 4400
33
+ gradient_accumulation_steps: 3
34
+ micro_batch_size: 8
35
+ num_epochs: 1
36
+ optimizer: adamw_torch
37
+ adam_beta2: 0.95
38
+ torchdistx_path:
39
+ lr_scheduler: cosine
40
+ learning_rate: 0.0001
41
+ train_on_inputs: false
42
+ group_by_length: false
43
+ float16: true
44
+ bf16: true
45
+ fp16: false
46
+ tf32: true
47
+ gradient_checkpointing: true
48
+ early_stopping_patience:
49
+ resume_from_checkpoint:
50
+ local_rank:
51
+ logging_steps: 1
52
+ xformers_attention:
53
+ flash_attention: true
54
+ gptq_groupsize:
55
+ gptq_model_v1:
56
+ warmup_steps: 100
57
+ eval_steps:
58
+ save_steps: 100
59
+ save_total_limit: 6
60
+ debug:
61
+ deepspeed:
62
+ weight_decay: 0.1
63
+ fsdp:
64
+ fsdp_config:
65
+ special_tokens:
66
+ bos_token: "<s>"
67
+ eos_token: "</s>"
68
+ unk_token: "<unk>"