pere committed on
Commit
5c4a811
1 Parent(s): 056f543

Saving weights and logs of step 179307

Browse files
events.out.tfevents.1633618406.t1v-n-4e27a527-w-0.192304.0.v2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:607afd35063035f39f517563d179d70394581ceab589fc16180981b815b3a03e
3
+ size 22317230
flax_model.msgpack CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5b90c9c809494625d737d5745a2996027c90a772e5d1d47773e008de96dbfd20
3
  size 5262371934
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cd89c66b4400cf75a191a2817c2939e3feee5bddaa5f5b7e26bc5f1e57d25729
3
  size 5262371934
run.sh CHANGED
@@ -5,11 +5,11 @@ python run_clm_mp.py \
5
  --validation_file /mnt/disks/flaxdisk/corpus/social_validation.json \
6
  --do_train \
7
  --do_eval \
8
- --block_size 1024 \
9
  --num_train_epochs 5 \
10
- --learning_rate 1e-5 \
11
- --per_device_train_batch_size 2 \
12
- --per_device_eval_batch_size 2 \
13
  --overwrite_output_dir \
14
  --output_dir "./" \
15
  --cache_dir /mnt/disks/flaxdisk/cache/ \
 
5
  --validation_file /mnt/disks/flaxdisk/corpus/social_validation.json \
6
  --do_train \
7
  --do_eval \
8
+ --block_size 512 \
9
  --num_train_epochs 5 \
10
+ --learning_rate 4e-6 \
11
+ --per_device_train_batch_size 4 \
12
+ --per_device_eval_batch_size 4 \
13
  --overwrite_output_dir \
14
  --output_dir "./" \
15
  --cache_dir /mnt/disks/flaxdisk/cache/ \