graphcore-rahult committed on
Commit
3798d10
1 Parent(s): df6f8ea

Training in progress, step 500

Browse files
Files changed (4) hide show
  1. config.json +1 -1
  2. ipu_config.json +3 -3
  3. pytorch_model.bin +1 -1
  4. training_args.bin +1 -1
config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "_name_or_path": "t5-small",
3
  "architectures": [
4
- "PipelinedT5ForConditionalGeneration"
5
  ],
6
  "d_ff": 2048,
7
  "d_kv": 64,
 
1
  {
2
  "_name_or_path": "t5-small",
3
  "architectures": [
4
+ "PoptorchPipelinedT5ForConditionalGeneration"
5
  ],
6
  "d_ff": 2048,
7
  "d_kv": 64,
ipu_config.json CHANGED
@@ -7,7 +7,7 @@
7
  "execute_encoder_on_cpu_for_generation": false,
8
  "gradient_accumulation_steps": 16,
9
  "inference_device_iterations": 5,
10
- "inference_replication_factor": 4,
11
  "ipus_per_replica": 4,
12
  "layers_per_ipu": [
13
  0,
@@ -25,8 +25,8 @@
25
  "optimum_version": "1.5.1",
26
  "output_mode": "final",
27
  "recompute_checkpoint_every_layer": true,
28
- "replicated_tensor_sharding": true,
29
- "replication_factor": 4,
30
  "seed": 42,
31
  "sharded_execution_for_inference": false,
32
  "transformers_version": "4.20.1"
 
7
  "execute_encoder_on_cpu_for_generation": false,
8
  "gradient_accumulation_steps": 16,
9
  "inference_device_iterations": 5,
10
+ "inference_replication_factor": 1,
11
  "ipus_per_replica": 4,
12
  "layers_per_ipu": [
13
  0,
 
25
  "optimum_version": "1.5.1",
26
  "output_mode": "final",
27
  "recompute_checkpoint_every_layer": true,
28
+ "replicated_tensor_sharding": false,
29
+ "replication_factor": 1,
30
  "seed": 42,
31
  "sharded_execution_for_inference": false,
32
  "transformers_version": "4.20.1"
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:40c97cabd74f9b644ac40d65c3f3ab45f006ef8c78771900288aee31ef9a6f1a
3
  size 121055163
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e8eac098140367a0fba1d56738c96b0c4c1a7187074a8a6d7d5bfaed35afd88
3
  size 121055163
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fdc004737cc12876f67d3c4fcd973cd086389ae76352752738debbe5baebd259
3
  size 2863
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b39b8d2451a66013ad718ab0cf6f9124df1f0733b578b11613d6fbb094ec3154
3
  size 2863