yhavinga committed on
Commit
446c112
1 Parent(s): 1833387

Saving weights and logs of step 300

Browse files
flax_model.msgpack CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:017c34e041bd61f90e1e78c986113b87116dbefe5ed2db7c8343058b9b025a6e
3
  size 891548548
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f1d8c763d288f266b49c1a11c5f341c28fd493185af0e577eb4f972c9de4afd8
3
  size 891548548
run_t5.sh CHANGED
@@ -17,10 +17,10 @@ mkdir -p "${MODEL_DIR}/runs"
17
  --do_train --do_eval \
18
  --adafactor \
19
  --max_seq_length="512" \
20
- --gradient_accumulation_steps="16" \
21
  --per_device_train_batch_size="32" \
22
  --per_device_eval_batch_size="32" \
23
- --learning_rate="5e-3" \
 
24
  --overwrite_output_dir \
25
  --num_train_epochs="1" \
26
  --logging_steps="15" \
@@ -32,6 +32,7 @@ mkdir -p "${MODEL_DIR}/runs"
32
  #git commit -m "Update pytorch model after training"
33
  #git push origin main
34
 
 
 
35
 
36
- # --dtype="bfloat16" \
37
- # --resume_from_checkpoint="${MODEL_DIR}/ckpt-3300" \
 
17
  --do_train --do_eval \
18
  --adafactor \
19
  --max_seq_length="512" \
 
20
  --per_device_train_batch_size="32" \
21
  --per_device_eval_batch_size="32" \
22
+ --learning_rate="1e-2" \
23
+ --dtype="bfloat16" \
24
  --overwrite_output_dir \
25
  --num_train_epochs="1" \
26
  --logging_steps="15" \
 
32
  #git commit -m "Update pytorch model after training"
33
  #git push origin main
34
 
35
+ # --learning_rate="5e-3" \
36
+ # --gradient_accumulation_steps="2" \
37
 
38
+ # --resume_from_checkpoint="${MODEL_DIR}/ckpt-3300" \
 
runs/Jul10_07-45-49_t1v-n-0e7426e8-w-0/events.out.tfevents.1625903173.t1v-n-0e7426e8-w-0.20563.3.v2 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bc901d2e6b8e7e9bb6834c37930f08ed3dd4704877c26d80a07afe26132d6168
3
- size 136359
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:07af3cc1b9177077621a9f9cd2b3d36aa028237973caf686c9e324e89cc25de9
3
+ size 147729
runs/Jul10_08-38-10_t1v-n-0e7426e8-w-0/events.out.tfevents.1625906314.t1v-n-0e7426e8-w-0.25839.3.v2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f87e0b93569f9ebb013314589bc05f05421f4cad6c6903192a28805a6a75ca26
3
+ size 45399