dalle-mini / tools /train /sweep.yaml
boris's picture
feat(train): update sweep config
bbbf7c8
raw history blame
No virus
883 Bytes
program: train.py
project: dalle-mini
method: random
metric:
name: eval/loss
goal: minimize
parameters:
optim:
value: distributed_shampoo
learning_rate:
distribution: log_uniform
# from exp(min) to exp(max)
min: -9.2
max: -6.9
tokenizer_name:
value: boris/dalle-mini-tokenizer
config_name:
value: ./config/mini
dtype:
value: bfloat16
dataset_repo_or_path:
value: ./data
per_device_train_batch_size:
value: 64
per_device_eval_batch_size:
value: 64
gradient_accumulation_steps:
value: 1
warmup_steps:
value: 1000
num_train_epochs:
value: 1
max_train_samples:
value: 1000000
logging_steps:
value: 40
eval_steps:
value: 200
command:
- python3
- ${program}
- "--streaming"
- "--output_dir"
- "./output"
- "--overwrite_output_dir"
- "--do_train"
- "--do_eval"
- ${args}