graphcore-rahult committed on
Commit
e2b24b7
1 Parent(s): daed369

Training in progress, step 500

Browse files
Files changed (4) hide show
  1. config.json +1 -1
  2. ipu_config.json +3 -3
  3. pytorch_model.bin +1 -1
  4. training_args.bin +1 -1
config.json CHANGED
@@ -5,7 +5,7 @@
5
  "add_bias_logits": false,
6
  "add_final_layer_norm": false,
7
  "architectures": [
8
- "PipelinedBartForConditionalGeneration"
9
  ],
10
  "attention_dropout": 0.1,
11
  "bos_token_id": 0,
 
5
  "add_bias_logits": false,
6
  "add_final_layer_norm": false,
7
  "architectures": [
8
+ "PoptorchPipelinedBartForConditionalGeneration"
9
  ],
10
  "attention_dropout": 0.1,
11
  "bos_token_id": 0,
ipu_config.json CHANGED
@@ -7,7 +7,7 @@
7
  "execute_encoder_on_cpu_for_generation": false,
8
  "gradient_accumulation_steps": 128,
9
  "inference_device_iterations": 6,
10
- "inference_replication_factor": 4,
11
  "ipus_per_replica": 4,
12
  "layers_per_ipu": [
13
  0,
@@ -25,8 +25,8 @@
25
  "optimum_version": "1.5.1",
26
  "output_mode": "final",
27
  "recompute_checkpoint_every_layer": true,
28
- "replicated_tensor_sharding": true,
29
- "replication_factor": 4,
30
  "seed": 42,
31
  "sharded_execution_for_inference": false,
32
  "transformers_version": "4.20.1"
 
7
  "execute_encoder_on_cpu_for_generation": false,
8
  "gradient_accumulation_steps": 128,
9
  "inference_device_iterations": 6,
10
+ "inference_replication_factor": 1,
11
  "ipus_per_replica": 4,
12
  "layers_per_ipu": [
13
  0,
 
25
  "optimum_version": "1.5.1",
26
  "output_mode": "final",
27
  "recompute_checkpoint_every_layer": true,
28
+ "replicated_tensor_sharding": false,
29
+ "replication_factor": 1,
30
  "seed": 42,
31
  "sharded_execution_for_inference": false,
32
  "transformers_version": "4.20.1"
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5187b7724855d803586b9715d32e4c6c8f7579377b719b48fb6d137aad166753
3
  size 279024057
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:884fbc940cd53ff641c808384929b4e2902ce4541b38457b090b52fe2874f0af
3
  size 279024057
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3123096a95a2e86c9ed51435f10bf85c58130ef41ec57a9517702e555c9c5b46
3
  size 2863
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4134102b42655682ff52c24e250b07795be661936bf3e898f217579d9a64a3f1
3
  size 2863