versae's picture
Saving weights and logs of step 1000
9c3de9e
{
"os": "Linux-5.4.0-1043-gcp-x86_64-with-glibc2.29",
"python": "3.8.10",
"heartbeatAt": "2022-01-14T21:28:58.974844",
"startedAt": "2022-01-14T21:28:55.397355",
"docker": null,
"cpu_count": 96,
"cuda": null,
"args": [
"--output_dir=./",
"--model_type=roberta",
"--config_name=roberta-base",
"--tokenizer_name=NbAiLab/nb-roberta-base",
"--dataset_name=NbAiLab/NCC",
"--max_seq_length=128",
"--weight_decay=0.01",
"--per_device_train_batch_size=250",
"--per_device_eval_batch_size=250",
"--pad_to_max_length",
"--learning_rate=6e-4",
"--warmup_steps=10000",
"--overwrite_output_dir",
"--num_train_epochs=3",
"--adam_beta1=0.9",
"--adam_beta2=0.98",
"--adam_epsilon=1e-6",
"--logging_steps=1000",
"--save_steps=1000",
"--eval_steps=1000",
"--do_train",
"--do_eval",
"--dtype=bfloat16",
"--push_to_hub"
],
"state": "running",
"program": "run_mlm_flax.py",
"codePath": "run_mlm_flax.py",
"git": {
"remote": "https://huggingface.co/versae/roberta-base-ncc",
"commit": "502df078f73cf93ca9380fcac1c9b9c7598a445f"
},
"email": "versae@gmail.com",
"root": "/data/roberta-base-ncc",
"host": "t1v-n-eedfb410-w-0",
"username": "javierr",
"executable": "/data/flax/bin/python"
}