pere committed on
Commit
d2e0660
1 Parent(s): 6087912

Saving weights and logs of step 500

Browse files
config.json CHANGED
@@ -65,7 +65,7 @@
65
  }
66
  },
67
  "tokenizer_class": "GPT2Tokenizer",
68
- "transformers_version": "4.9.0.dev0",
69
  "use_cache": true,
70
  "vocab_size": 50264,
71
  "window_size": 256
 
65
  }
66
  },
67
  "tokenizer_class": "GPT2Tokenizer",
68
+ "transformers_version": "4.11.0.dev0",
69
  "use_cache": true,
70
  "vocab_size": 50264,
71
  "window_size": 256
events.out.tfevents.1631191833.t1v-n-4e27a527-w-0.1937094.0.v2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:121d2e96899f6772a57b1228900bcbfd6ba74fa50e4982f41b305cb7571b56c2
3
+ size 40
flax_model.msgpack CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c694052f126d1176eaa04c0dffd77b0c49a301f6677b83a9d39d4a61f3c59ccc
3
  size 5262371934
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21114569ff0ec5434ff6b47f5b8b254ab174c5ba6c4ece5f7edd4b8a7526ece0
3
  size 5262371934
run.sh CHANGED
@@ -11,7 +11,7 @@ python run_clm_mp.py \
11
  --per_device_train_batch_size 2 \
12
  --per_device_eval_batch_size 2 \
13
  --overwrite_output_dir \
14
- --output_dir /mnt/disks/flaxdisk/output/ \
15
  --cache_dir /mnt/disks/flaxdisk/cache/ \
16
  --preprocessing_num_workers 96 \
17
  --dtype bfloat16 \
 
11
  --per_device_train_batch_size 2 \
12
  --per_device_eval_batch_size 2 \
13
  --overwrite_output_dir \
14
+ --output_dir "./" \
15
  --cache_dir /mnt/disks/flaxdisk/cache/ \
16
  --preprocessing_num_workers 96 \
17
  --dtype bfloat16 \