tanthinhdt committed on
Commit
7382540
1 Parent(s): f1b22b0

Upload vsl_s2g-2024-03-04_08-52-53/vsl_s2g.yaml with huggingface_hub

Browse files
vsl_s2g-2024-03-04_08-52-53/vsl_s2g.yaml ADDED
@@ -0,0 +1,67 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ task: S2G
2
+ data:
3
+ name: vsl
4
+ subset: rgb_videos
5
+ num_proc: 24
6
+ cache_dir: data/external/huggingface
7
+ input_streams:
8
+ - rgb
9
+ level: word # word or char
10
+ txt_lowercase: true
11
+ max_sent_length: 400
12
+ transform_cfg:
13
+ rand_crop_size: 224
14
+ rand_crop_threshold: 0.7
15
+ rand_crop_bottom_area: 0.7
16
+ rand_crop_aspect_ratio_min: 0.75
17
+ rand_crop_aspect_ratio_max: 1.3
18
+ cent_crop_size: 224
19
+ scale_size: 224
20
+ color_jitter_threshold: 0.2
21
+ temporal_augmentation:
22
+ tmin: 0.5
23
+ tmax: 1.5
24
+ testing:
25
+ cfg:
26
+ recognition:
27
+ beam_size: 5
28
+ training:
29
+ overwrite: false
30
+ model_dir: experiments/outputs/SingleStream/vsl_s2g
31
+ shuffle: true
32
+ batch_size: 4
33
+ total_epoch: 100
34
+ keep_last_ckpts: 5
35
+ validation:
36
+ unit: epoch
37
+ freq: 1
38
+ cfg:
39
+ recognition:
40
+ beam_size: 2
41
+ optimization:
42
+ learning_rate:
43
+ default: 4.0e-3
44
+ optimizer: sgd
45
+ weight_decay: 1.0e-3
46
+ momentum: 0.9
47
+ betas:
48
+ - 0.9
49
+ - 0.998
50
+ scheduler: cosineannealing
51
+ t_max: 50
52
+ model:
53
+ RecognitionNetwork:
54
+ GlossTokenizer:
55
+ gloss2id_file: pretrained/mBart_vi/gloss2ids.pkl
56
+ s3d:
57
+ pretrained_ckpt: pretrained/s3ds_actioncls
58
+ use_block: 4
59
+ freeze_block: 1
60
+ visual_head:
61
+ input_size: 832
62
+ hidden_size: 512
63
+ ff_size: 2048
64
+ pe: True
65
+ ff_kernelsize:
66
+ - 3
67
+ - 3