Saving weights and logs of step 179307
Browse files
events.out.tfevents.1633618406.t1v-n-4e27a527-w-0.192304.0.v2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:607afd35063035f39f517563d179d70394581ceab589fc16180981b815b3a03e
|
3 |
+
size 22317230
|
flax_model.msgpack
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5262371934
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cd89c66b4400cf75a191a2817c2939e3feee5bddaa5f5b7e26bc5f1e57d25729
|
3 |
size 5262371934
|
run.sh
CHANGED
@@ -5,11 +5,11 @@ python run_clm_mp.py \
|
|
5 |
--validation_file /mnt/disks/flaxdisk/corpus/social_validation.json \
|
6 |
--do_train \
|
7 |
--do_eval \
|
8 |
-
--block_size
|
9 |
--num_train_epochs 5 \
|
10 |
-
--learning_rate
|
11 |
-
--per_device_train_batch_size
|
12 |
-
--per_device_eval_batch_size
|
13 |
--overwrite_output_dir \
|
14 |
--output_dir "./" \
|
15 |
--cache_dir /mnt/disks/flaxdisk/cache/ \
|
|
|
5 |
--validation_file /mnt/disks/flaxdisk/corpus/social_validation.json \
|
6 |
--do_train \
|
7 |
--do_eval \
|
8 |
+
--block_size 512 \
|
9 |
--num_train_epochs 5 \
|
10 |
+
--learning_rate 4e-6 \
|
11 |
+
--per_device_train_batch_size 4 \
|
12 |
+
--per_device_eval_batch_size 4 \
|
13 |
--overwrite_output_dir \
|
14 |
--output_dir "./" \
|
15 |
--cache_dir /mnt/disks/flaxdisk/cache/ \
|