liho00 committed on
Commit
3feaa12
1 Parent(s): ae525f6

Upload training_config.yml with huggingface_hub

Browse files
Files changed (1) hide show
  1. training_config.yml +7 -7
training_config.yml CHANGED
@@ -21,12 +21,12 @@ checkpointer:
21
  recipe_checkpoint: null
22
  output_dir: output_checkpoints/experiment_1
23
  model_type: LLAMA3
24
- resume_from_checkpoint: true
25
  interim_checkpoint_steps: 5000
26
  interim_gen_steps: null
27
  max_new_tokens: 100
28
- temperature: 0.6
29
- top_k: 300
30
  dataset:
31
  _component_: ds.EvenBatcher
32
  buffer_size: 36
@@ -46,7 +46,7 @@ dataset:
46
  train_on_input: false
47
  seed: null
48
  shuffle: true
49
- batch_size: 4
50
  optimizer:
51
  _component_: torch.optim.AdamW
52
  weight_decay: 0.01
@@ -77,8 +77,8 @@ inference:
77
  {video}
78
 
79
  Caption the previous video.'
80
- max_new_tokens: 300
81
- temperature: 0.6
82
- top_k: 300
83
  quantizer: null
84
  gradient-accumulation-steps: 32
 
21
  recipe_checkpoint: null
22
  output_dir: output_checkpoints/experiment_1
23
  model_type: LLAMA3
24
+ resume_from_checkpoint: false
25
  interim_checkpoint_steps: 5000
26
  interim_gen_steps: null
27
  max_new_tokens: 100
28
+ temperature: 0.8
29
+ top_k: 333
30
  dataset:
31
  _component_: ds.EvenBatcher
32
  buffer_size: 36
 
46
  train_on_input: false
47
  seed: null
48
  shuffle: true
49
+ batch_size: 6
50
  optimizer:
51
  _component_: torch.optim.AdamW
52
  weight_decay: 0.01
 
77
  {video}
78
 
79
  Caption the previous video.'
80
+ max_new_tokens: 333
81
+ temperature: 0.8
82
+ top_k: 333
83
  quantizer: null
84
  gradient-accumulation-steps: 32