yhavinga committed
Commit f82139d
1 Parent(s): 233fa8e

Update run config

Files changed (1):
  1. run_gpt.sh +4 -2
run_gpt.sh CHANGED
@@ -4,7 +4,7 @@ export HF_PROJECT="gpt2-medium-dutch"
 
 # Variables for training the tokenizer and creating the config
 export VOCAB_SIZE="50257"
-export DATASET="yhavinga/mc4_nl_cleaned" # Name of the dataset in the Huggingface Hub
+export DATASET="/home/yeb/data/mc4_nl_cleaned/mc4_nl_cleaned.py" # Name of the dataset in the Huggingface Hub
 export DATASET_CONFIG="full" # Config of the dataset in the Huggingface Hub
 export DATASET_SPLIT="train" # Split to use for training tokenizer and model
 export TEXT_FIELD="text" # Field containing the text to be used for training
@@ -26,7 +26,9 @@ python run_clm_flax.py \
   --learning_rate="0.0024" --warmup_steps="5000" \
   --adam_beta1="0.9" --adam_beta2="0.98" --weight_decay="0.01" \
   --overwrite_output_dir \
-  --num_train_epochs="4" \
+  --num_train_epochs="2" \
+  --dataloader_num_workers="64" \
+  --preprocessing_num_workers="64" \
   --logging_steps="500" \
   --save_steps="40000" \
   --eval_steps="2500" \
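
The DATASET change swaps the Hub dataset ID for a local copy of the dataset's loading script. datasets.load_dataset accepts either form, which is presumably why nothing else in the script needs to change; a minimal sketch, assuming run_clm_flax.py resolves $DATASET and $DATASET_CONFIG via load_dataset:

# Minimal sketch; the two dataset values below are taken from the diff above.
from datasets import load_dataset

# Before this commit: resolve the dataset by its Huggingface Hub ID.
ds_hub = load_dataset("yhavinga/mc4_nl_cleaned", "full", split="train")

# After this commit: run a local copy of the loading script instead.
ds_local = load_dataset(
    "/home/yeb/data/mc4_nl_cleaned/mc4_nl_cleaned.py", "full", split="train"
)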
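
The two new worker flags raise CPU parallelism around the training loop. In run_clm-style scripts, --preprocessing_num_workers is typically forwarded to the num_proc argument of datasets.map; a hedged sketch of that pattern, where the "gpt2" tokenizer and the tokenize_function are illustrative rather than read from this repo's run_clm_flax.py:

# Hedged sketch of the usual --preprocessing_num_workers plumbing in
# run_clm-style scripts; the tokenizer choice here is an assumption.
from datasets import load_dataset
from transformers import AutoTokenizer

tokenizer = AutoTokenizer.from_pretrained("gpt2")
raw = load_dataset("yhavinga/mc4_nl_cleaned", "full", split="train")

def tokenize_function(examples):
    # TEXT_FIELD="text" per the config above.
    return tokenizer(examples["text"])

# num_proc fans tokenization out over 64 processes, matching
# --preprocessing_num_workers="64" in the updated run config.
tokenized = raw.map(
    tokenize_function,
    batched=True,
    num_proc=64,
    remove_columns=raw.column_names,
)

--dataloader_num_workers presumably parallelizes batch loading in the same spirit; exactly how it is consumed depends on this repo's run_clm_flax.py.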