Iheb-Chaabane committed on
Commit
a235660
1 Parent(s): d89607f

Upload LlamaForCausalLM

Browse files
Files changed (3) hide show
  1. config.json +4 -2
  2. generation_config.json +2 -0
  3. model.safetensors +1 -1
config.json CHANGED
@@ -1,17 +1,19 @@
1
  {
2
- "_name_or_path": "config.json",
 
3
  "architectures": [
4
  "LlamaForCausalLM"
5
  ],
6
  "attention_bias": false,
7
  "attention_dropout": 0.0,
 
8
  "eos_token_id": 11,
9
  "head_dim": 256,
10
  "hidden_act": "silu",
11
  "hidden_size": 2048,
12
  "initializer_range": 0.02,
13
  "intermediate_size": 8192,
14
- "max_position_embeddings": 32768,
15
  "mlp_bias": false,
16
  "model_type": "llama",
17
  "num_attention_heads": 8,
 
1
  {
2
+ "_name_or_path": "/home/ec2-user/work/1b-base",
3
+ "activation": "swiglu",
4
  "architectures": [
5
  "LlamaForCausalLM"
6
  ],
7
  "attention_bias": false,
8
  "attention_dropout": 0.0,
9
+ "bos_token_id": 11,
10
  "eos_token_id": 11,
11
  "head_dim": 256,
12
  "hidden_act": "silu",
13
  "hidden_size": 2048,
14
  "initializer_range": 0.02,
15
  "intermediate_size": 8192,
16
+ "max_position_embeddings": 4096,
17
  "mlp_bias": false,
18
  "model_type": "llama",
19
  "num_attention_heads": 8,
generation_config.json CHANGED
@@ -1,4 +1,6 @@
1
  {
 
 
2
  "eos_token_id": 11,
3
  "transformers_version": "4.46.1"
4
  }
 
1
  {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 11,
4
  "eos_token_id": 11,
5
  "transformers_version": "4.46.1"
6
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:332c2b9380c4eae0c33827d36e6c74c47c34262acf808ac694184ae81cb59713
3
  size 3338836632
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c2c3117923ab2e22e8d07a92cd8fd069ce70a8b1c8557894194bbfd8fcee196
3
  size 3338836632