Ghanvert committed on
Commit
55dc913
·
verified ·
1 Parent(s): b5de23b

model updated

Browse files
Files changed (4) hide show
  1. config.json +2 -2
  2. generation_config.json +1 -1
  3. pytorch_model.bin +3 -0
  4. status.json +7 -2
config.json CHANGED
@@ -27,8 +27,8 @@
27
  "num_hidden_layers": 24,
28
  "pad_token_id": 1,
29
  "scale_embedding": true,
30
- "torch_dtype": "float32",
31
- "transformers_version": "4.39.1",
32
  "use_cache": true,
33
  "vocab_size": 256206
34
  }
 
27
  "num_hidden_layers": 24,
28
  "pad_token_id": 1,
29
  "scale_embedding": true,
30
+ "torch_dtype": "bfloat16",
31
+ "transformers_version": "4.41.2",
32
  "use_cache": true,
33
  "vocab_size": 256206
34
  }
generation_config.json CHANGED
@@ -5,5 +5,5 @@
5
  "eos_token_id": 2,
6
  "max_length": 200,
7
  "pad_token_id": 1,
8
- "transformers_version": "4.39.1"
9
  }
 
5
  "eos_token_id": 2,
6
  "max_length": 200,
7
  "pad_token_id": 1,
8
+ "transformers_version": "4.41.2"
9
  }
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fcd63ef1441f3c3fb6c579676bc0d22fd4faea09f9f7c5ee8dc706bab02e426b
3
+ size 6689870958
status.json CHANGED
@@ -1,4 +1,9 @@
1
  {
2
- "best_valid_loss": 0.6721298055989402,
3
- "best_train_loss": 0.20154881566216093
 
 
 
 
 
4
  }
 
1
  {
2
+ "best_train_loss": 1.0126271802325582,
3
+ "best_valid_loss": 1.7447916666666667,
4
+ "epoch": 2,
5
+ "epoch_step": 85,
6
+ "global_step": 330,
7
+ "eval_global_step": 33,
8
+ "evaluations_done": 11
9
  }