panini / .vscode /launch.json
amank
Made changes to cleaning code, modified number of warmup steps, getting eval samples from validation split
7839b8e
{
// VS Code debugger launch configurations for this workspace.
// Two entries are defined below: "Python: StreamingFile" (runs the active file
// with a fixed set of command-line arguments) and "Python: Current File"
// (runs the active file with no arguments).
// Use IntelliSense to learn about possible attributes.
// Hover to view descriptions of existing attributes.
// For more information, visit: https://go.microsoft.com/fwlink/?linkid=830387
"version": "0.2.0",
"configurations": [
{
// Launches whatever file is open in the active editor ("${file}") and passes
// it the argument list below. The arguments are only meaningful when the
// active file is a script that accepts these flags — presumably the
// RoBERTa/mC4 training script; TODO confirm which script this targets.
"name": "Python: StreamingFile",
// NOTE(review): recent versions of the VS Code Python Debugger extension
// prefer "type": "debugpy" and may flag "python" as deprecated — confirm
// against the extension version used by the team before changing.
"type": "python",
"request": "launch",
"program": "${file}",
// Each flag and its value are separate array elements; every value is a
// string, including the numeric ones.
"args": [
// Output directory, model config and tokenizer all point at the same
// "roberta_mc4_sentence_piece" path.
"--output_dir","roberta_mc4_sentence_piece",
"--model_type","roberta",
"--config_name","roberta_mc4_sentence_piece",
"--tokenizer_name","roberta_mc4_sentence_piece",
// Dataset "mc4" with config "hi" (presumably the Hindi subset — verify).
"--dataset_name","mc4",
"--dataset_config_name","hi",
"--max_seq_length","256",
"--per_device_train_batch_size","16",
"--per_device_eval_batch_size","16",
"--learning_rate","3e-4",
"--warmup_steps","1000",
// Bare flag: no value element follows it.
"--overwrite_output_dir",
"--adam_beta1","0.9",
"--adam_beta2","0.98",
"--num_train_steps","10000",
"--num_eval_samples","5000",
// NOTE(review): 90 workers assumes a machine with many CPU cores —
// confirm this is appropriate for a local debug session.
"--preprocessing_num_workers", "90",
"--logging_steps","250",
"--eval_steps","1000"
],
// Run the program in VS Code's integrated terminal.
"console": "integratedTerminal"
},
{
// Generic configuration: launches the file open in the active editor with
// no extra arguments, in the integrated terminal.
"name": "Python: Current File",
// NOTE(review): same "python" vs "debugpy" consideration as the
// "Python: StreamingFile" configuration — confirm before changing.
"type": "python",
"request": "launch",
"program": "${file}",
"console": "integratedTerminal"
}
]
}