graphcore-rahult committed on
Commit
49023e6
1 Parent(s): ddd68f7

Training in progress, step 500

Browse files
Files changed (4) hide show
  1. config.json +1 -1
  2. ipu_config.json +1 -1
  3. pytorch_model.bin +1 -1
  4. training_args.bin +1 -1
config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "_name_or_path": "bert-base-cased",
3
  "architectures": [
4
- "PipelinedBertForMaskedLM"
5
  ],
6
  "attention_probs_dropout_prob": 0.1,
7
  "classifier_dropout": null,
 
1
  {
2
  "_name_or_path": "bert-base-cased",
3
  "architectures": [
4
+ "PoptorchPipelinedBertForMaskedLM"
5
  ],
6
  "attention_probs_dropout_prob": 0.1,
7
  "classifier_dropout": null,
ipu_config.json CHANGED
@@ -3,7 +3,7 @@
3
  "device_iterations": 1,
4
  "embedding_serialization_factor": 0,
5
  "enable_half_partials": true,
6
- "executable_cache_dir": "/tmp/exe_cache",
7
  "execute_encoder_on_cpu_for_generation": false,
8
  "gradient_accumulation_steps": 64,
9
  "inference_device_iterations": 5,
 
3
  "device_iterations": 1,
4
  "embedding_serialization_factor": 0,
5
  "enable_half_partials": true,
6
+ "executable_cache_dir": "/tmp/exe_cache/language_modelling_from_scratch",
7
  "execute_encoder_on_cpu_for_generation": false,
8
  "gradient_accumulation_steps": 64,
9
  "inference_device_iterations": 5,
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0d19494fe316c8a48e054cada738b0e7e89497ce361b69da6376fcbcac02d302
3
  size 216750379
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8dda0f0e8c290dcaedb6403fc755cb91b3b0416cb726e5e23d058a6fafa30e73
3
  size 216750379
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:79bc3e1524c49a1c09ce54d5693c306e5d7f0159d52c0fd9c13f41371bb32c4f
3
  size 2735
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e564c5deff8c739fa6d9877ca2c8d1cbdedc008228e1b61154607bb8d65daf2f
3
  size 2735