Saving weights and logs of step 500
Browse files
- config.json +1 -1
- events.out.tfevents.1631191833.t1v-n-4e27a527-w-0.1937094.0.v2 +3 -0
- flax_model.msgpack +1 -1
- run.sh +1 -1
config.json
CHANGED
@@ -65,7 +65,7 @@
|
|
65 |
}
|
66 |
},
|
67 |
"tokenizer_class": "GPT2Tokenizer",
|
68 |
-
"transformers_version": "4.
|
69 |
"use_cache": true,
|
70 |
"vocab_size": 50264,
|
71 |
"window_size": 256
|
|
|
65 |
}
|
66 |
},
|
67 |
"tokenizer_class": "GPT2Tokenizer",
|
68 |
+
"transformers_version": "4.11.0.dev0",
|
69 |
"use_cache": true,
|
70 |
"vocab_size": 50264,
|
71 |
"window_size": 256
|
events.out.tfevents.1631191833.t1v-n-4e27a527-w-0.1937094.0.v2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:121d2e96899f6772a57b1228900bcbfd6ba74fa50e4982f41b305cb7571b56c2
|
3 |
+
size 40
|
flax_model.msgpack
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5262371934
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:21114569ff0ec5434ff6b47f5b8b254ab174c5ba6c4ece5f7edd4b8a7526ece0
|
3 |
size 5262371934
|
run.sh
CHANGED
@@ -11,7 +11,7 @@ python run_clm_mp.py \
|
|
11 |
--per_device_train_batch_size 2 \
|
12 |
--per_device_eval_batch_size 2 \
|
13 |
--overwrite_output_dir \
|
14 |
-
--output_dir
|
15 |
--cache_dir /mnt/disks/flaxdisk/cache/ \
|
16 |
--preprocessing_num_workers 96 \
|
17 |
--dtype bfloat16 \
|
|
|
11 |
--per_device_train_batch_size 2 \
|
12 |
--per_device_eval_batch_size 2 \
|
13 |
--overwrite_output_dir \
|
14 |
+
--output_dir "./" \
|
15 |
--cache_dir /mnt/disks/flaxdisk/cache/ \
|
16 |
--preprocessing_num_workers 96 \
|
17 |
--dtype bfloat16 \
|