File size: 1,428 Bytes
fed630b
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
{
  "adaptive_clipping": true,
  "audio_aligner_type": "audio_sa_3_3_pool_2",
  "audio_lora": false,
  "audio_lora_rank": 8,
  "audio_model_type": "hubert",
  "audio_pool_width": 1,
  "cal_balance_weight": 0.1,
  "cal_init": 1.0,
  "channel_dropout": 0.0,
  "code_dim": 384,
  "disentangle_weight": 0.0,
  "finetune_audio_model": true,
  "finetune_image_model": false,
  "gather_tensors": true,
  "gradient_clipping": 10.0,
  "head_agg": "max_elementwise",
  "image_aligner_type": "image_linear",
  "image_lora": true,
  "image_lora_rank": 8,
  "image_model_token_type": "token",
  "image_model_type": "dino8",
  "image_pool_width": 2,
  "learn_audio_cls": true,
  "loss_leak": 0.0,
  "loss_margin": 0.0,
  "loss_type": "nce",
  "lr": 5e-05,
  "lr_cycle_length": 50000,
  "lr_schedule": null,
  "lr_warmup": 1000,
  "mask_silence": true,
  "memory_buffer_size": 0,
  "mixup_weight": 0.0,
  "neg_audio": true,
  "neg_audio_weight": 0.01,
  "nonneg_pressure": 0.01,
  "nonneg_sim": false,
  "norm_vectors": false,
  "optimizer": "adam",
  "output_root": "/mnt/azureml/cr/j/7e4ff299c6de48ee8bd4222906d5eca7/cap/data-capability/wd/INPUT_video_analysis_store_3_video_analysis_store_3",
  "pretrain_lr": 5e-05,
  "silence_l1": 0.01,
  "silence_l2": 0.0,
  "sim_agg_heads": 1,
  "sim_agg_type": "misa",
  "sim_use_cls": false,
  "spatial_dropout": 0.0,
  "specialization_weight": 0.05,
  "tv_weight": 0.01,
  "use_cached_embs": false
}