Saving weights and logs of step 10000

Files changed (4) hide show

config.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "roberta-large",
+  "_name_or_path": "./",
   "architectures": [
     "RobertaForMaskedLM"
   ],

events.out.tfevents.1637523639.t1v-n-8eba1090-w-0.295438.0.v2 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:7dab021a8cc85a18e8d99a685190cf5559b1a15e91bd9964d83f3e2f5aa039a0
+size 1470757

flax_model.msgpack ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:a812e90865843a99f72e21007b3cd0eb29c4ab2ffa06216290434f9f04324333
+size 1421662309

start_train.sh CHANGED Viewed

@@ -1,5 +1,6 @@
 # set train hyperparams
 unset LD_PRELOAD
+export HF_DATASETS_CACHE="/researchdisk/datasets_cache"
 python3 run_mlm_flax.py \
     --output_dir="./" \
     --model_type="roberta" \