Jinchen committed on
Commit
62bebc6
1 Parent(s): 19d48cb

Training in progress, step 500

Browse files
Files changed (3) hide show
  1. ipu_config.json +10 -4
  2. pytorch_model.bin +2 -2
  3. training_args.bin +2 -2
ipu_config.json CHANGED
@@ -1,12 +1,13 @@
1
  {
 
2
  "decompose_grad_sum": false,
3
- "device_iterations": 2,
4
- "embedding_serialization_factor": 4,
5
  "enable_half_first_order_momentum": true,
6
  "enable_half_partials": true,
7
  "executable_cache_dir": "./exe_cache",
8
  "execute_encoder_on_cpu_for_generation": false,
9
- "gradient_accumulation_steps": 64,
10
  "inference_device_iterations": 5,
11
  "inference_replication_factor": 4,
12
  "ipus_per_replica": 4,
@@ -16,7 +17,12 @@
16
  4,
17
  4
18
  ],
19
- "matmul_proportion": 0.25,
 
 
 
 
 
20
  "optimizer_state_offchip": true,
21
  "optimum_version": "1.3.0",
22
  "output_mode": "final",
 
1
  {
2
+ "auto_loss_scaling": false,
3
  "decompose_grad_sum": false,
4
+ "device_iterations": 1,
5
+ "embedding_serialization_factor": 2,
6
  "enable_half_first_order_momentum": true,
7
  "enable_half_partials": true,
8
  "executable_cache_dir": "./exe_cache",
9
  "execute_encoder_on_cpu_for_generation": false,
10
+ "gradient_accumulation_steps": 16,
11
  "inference_device_iterations": 5,
12
  "inference_replication_factor": 4,
13
  "ipus_per_replica": 4,
 
17
  4,
18
  4
19
  ],
20
+ "matmul_proportion": [
21
+ 0.25,
22
+ 0.25,
23
+ 0.25,
24
+ 0.25
25
+ ],
26
  "optimizer_state_offchip": true,
27
  "optimum_version": "1.3.0",
28
  "output_mode": "final",
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bc52b84cb95a5b6b6b240355ea46fc7d9e6554e531dbe267b566a047a2481499
3
- size 261514473
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1854dafd8849f3aac5d15e43a378d11f97efab3a84b6131e2aabceb48e4675fc
3
+ size 162657115
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8ee5f4f3b3d5de4e91c70cda2cbf0ccfdf8ca6bf37533031273cc536c8edc58d
3
- size 2607
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a02d178f04ca1e4f706509a8c510c6ef45c0cdb20d4bd5e0ea009974c779701
3
+ size 2671