tanthinhdt committed on
Commit
fd29ef8
1 Parent(s): 9eccd73

Upload wlasl300_s2g-2024-02-28_11-59-38/wlasl300_s2g.yaml with huggingface_hub

Browse files
wlasl300_s2g-2024-02-28_11-59-38/wlasl300_s2g.yaml ADDED
@@ -0,0 +1,69 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ task: S2G
2
+ data:
3
+ name: wlasl300
4
+ subset: rgb_videos
5
+ num_proc: 2
6
+ cache_dir: data/external/huggingface
7
+ input_streams:
8
+ - rgb
9
+ level: word # word or char
10
+ txt_lowercase: true
11
+ max_sent_length: 400
12
+ transform_cfg:
13
+ rand_crop_size: 224
14
+ rand_crop_threshold: 0.7
15
+ rand_crop_bottom_area: 0.7
16
+ rand_crop_aspect_ratio_min: 0.75
17
+ rand_crop_aspect_ratio_max: 1.3
18
+ cent_crop_size: 224
19
+ scale_size: 224
20
+ color_jitter_threshold: 0.2
21
+ temporal_augmentation:
22
+ tmin: 0.5
23
+ tmax: 1.5
24
+ testing:
25
+ cfg:
26
+ recognition:
27
+ beam_size: 5
28
+ training:
29
+ from_ckpt: false
30
+ from_best: false
31
+ overwrite: true
32
+ model_dir: experiments/outputs/SingleStream/wlasl300_s2g
33
+ shuffle: true
34
+ batch_size: 3
35
+ total_epoch: 50
36
+ keep_last_ckpts: 5
37
+ validation:
38
+ unit: epoch
39
+ freq: 1
40
+ cfg:
41
+ recognition:
42
+ beam_size: 2
43
+ optimization:
44
+ learning_rate:
45
+ default: 2.0e-3
46
+ optimizer: sgd
47
+ weight_decay: 1.0e-3
48
+ momentum: 0.9
49
+ betas:
50
+ - 0.9
51
+ - 0.998
52
+ scheduler: cosineannealing
53
+ t_max: 50
54
+ model:
55
+ RecognitionNetwork:
56
+ GlossTokenizer:
57
+ gloss2id_file: pretrained/mBart_en/gloss2ids.pkl
58
+ s3d:
59
+ pretrained_ckpt: pretrained/s3ds_actioncls
60
+ use_block: 4
61
+ freeze_block: 1
62
+ visual_head:
63
+ input_size: 832
64
+ hidden_size: 512
65
+ ff_size: 2048
66
+ pe: True
67
+ ff_kernelsize:
68
+ - 3
69
+ - 3