graphcore-rahult committed on
Commit
3111a0b
·
1 Parent(s): 4210d46

Training in progress, step 500

Browse files
Files changed (4) hide show
  1. config.json +1 -1
  2. ipu_config.json +4 -7
  3. pytorch_model.bin +1 -1
  4. training_args.bin +2 -2
config.json CHANGED
@@ -33,7 +33,7 @@
33
  }
34
  },
35
  "torch_dtype": "float16",
36
- "transformers_version": "4.18.0",
37
  "use_cache": true,
38
  "vocab_size": 50257
39
  }
 
33
  }
34
  },
35
  "torch_dtype": "float16",
36
+ "transformers_version": "4.20.1",
37
  "use_cache": true,
38
  "vocab_size": 50257
39
  }
ipu_config.json CHANGED
@@ -1,10 +1,9 @@
1
  {
2
- "decompose_grad_sum": false,
3
  "device_iterations": 2,
4
  "embedding_serialization_factor": 4,
5
- "enable_half_first_order_momentum": true,
6
  "enable_half_partials": true,
7
- "executable_cache_dir": "./exe_cache",
8
  "execute_encoder_on_cpu_for_generation": false,
9
  "gradient_accumulation_steps": 16,
10
  "inference_device_iterations": 5,
@@ -18,14 +17,12 @@
18
  ],
19
  "matmul_proportion": 0.25,
20
  "optimizer_state_offchip": true,
21
- "optimum_version": "1.1.1",
22
  "output_mode": "final",
23
- "profile_dir": "",
24
  "recompute_checkpoint_every_layer": true,
25
  "replicated_tensor_sharding": false,
26
  "replication_factor": 1,
27
  "seed": 42,
28
  "sharded_execution_for_inference": false,
29
- "transformers_version": "4.18.0",
30
- "use_popdist": false
31
  }
 
1
  {
2
+ "auto_loss_scaling": false,
3
  "device_iterations": 2,
4
  "embedding_serialization_factor": 4,
 
5
  "enable_half_partials": true,
6
+ "executable_cache_dir": "/tmp/exe_cache",
7
  "execute_encoder_on_cpu_for_generation": false,
8
  "gradient_accumulation_steps": 16,
9
  "inference_device_iterations": 5,
 
17
  ],
18
  "matmul_proportion": 0.25,
19
  "optimizer_state_offchip": true,
20
+ "optimum_version": "1.5.1",
21
  "output_mode": "final",
 
22
  "recompute_checkpoint_every_layer": true,
23
  "replicated_tensor_sharding": false,
24
  "replication_factor": 1,
25
  "seed": 42,
26
  "sharded_execution_for_inference": false,
27
+ "transformers_version": "4.20.1"
 
28
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2ec41fd9943e837076f0f51e71ade17eb70d2dddb442c721514ecb861ec5d721
3
  size 261514473
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:98be7a37645b50ad99a01b1d44d9ab4abd27738bff597b76c13b02edde1f3ed6
3
  size 261514473
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:388d799c1733715ab6da9bab9bd736a7df5fcaaafd9649521d4019e8b3b08e3c
3
- size 2671
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:48abb1513a620a1159d070ffd661e2132964549a3d5f8120b3953f4519b604ca
3
+ size 2735