boris committed on
Commit
e1555d4
1 Parent(s): dc5c024

feat: update sweep

Browse files
Files changed (1) hide show
  1. tools/train/sweep.yaml +25 -30
tools/train/sweep.yaml CHANGED
@@ -11,44 +11,39 @@ parameters:
11
  # from exp(min) to exp(max)
12
  min: -6.9
13
  max: -3.5
 
 
 
 
 
 
 
 
 
 
 
 
14
  gradient_accumulation_steps:
15
- value: 8
16
  warmup_steps:
17
  value: 4000
18
- #TODO: outdated command
 
 
 
 
 
 
 
 
19
  command:
20
  - python3
21
  - ${program}
22
- - "--tokenizer_name"
23
- - "boris/dalle-mini-tokenizer"
24
- - "--config_name"
25
- - "facebook/bart-large-cnn"
26
- - "--dataset_repo_or_path"
27
- - "boris/gis_vqgan_f16_16384"
28
  - "--streaming"
29
- - "--use_auth_token"
30
- - "--image_vocab_size"
31
- - 16384
32
- - "--image_length"
33
- - 256
34
- - "--normalize_text"
35
- - True
36
- - "--per_device_train_batch_size"
37
- - 56
38
- - "--per_device_eval_batch_size"
39
- - 56
40
- - "--adafactor"
41
- - "--do_train"
42
- - "--do_eval"
43
- - "--num_train_epochs"
44
- - 1
45
- - "--logging_steps"
46
- - 40
47
- - "--eval_steps"
48
- - 800
49
  - "--output_dir"
50
  - "./output"
51
  - "--overwrite_output_dir"
52
- - "--max_train_samples"
53
- - 10000000
 
54
  - ${args}
 
11
  # from exp(min) to exp(max)
12
  min: -6.9
13
  max: -3.5
14
+ tokenizer_name:
15
+ value: boris/dalle-mini-tokenizer
16
+ config_name:
17
+ value: ./config/mini
18
+ dtype:
19
+ value: bfloat16
20
+ dataset_repo_or_path:
21
+ value: ./data
22
+ per_device_train_batch_size:
23
+ value: 64
24
+ per_device_eval_batch_size:
25
+ value: 64
26
  gradient_accumulation_steps:
27
+ value: 1
28
  warmup_steps:
29
  value: 4000
30
+ num_train_epochs:
31
+ value: 1
32
+ logging_steps:
33
+ value: 32
34
+ eval_steps:
35
+ value: 800
36
+ max_train_samples:
37
+ value: 1000000
38
+
39
  command:
40
  - python3
41
  - ${program}
 
 
 
 
 
 
42
  - "--streaming"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
43
  - "--output_dir"
44
  - "./output"
45
  - "--overwrite_output_dir"
46
+ - "--adafactor"
47
+ - "--do_train"
48
+ - "--do_eval"
49
  - ${args}