# Model configuration: an image encoder and a text encoder under one MODEL node.
# NOTE(review): the nesting below was reconstructed from a source in which the
# whole document had been collapsed onto a single line (which is not parseable
# YAML). Confirm the hierarchy against the schema of the config loader.
MODEL:
  NAME: unicl_swin_tiny
  # NOTE(review): presumably the width of the shared image/text projection
  # space; it equals TEXT_ENCODER.WIDTH here — confirm against the consumer.
  DIM_PROJECTION: 512

  IMAGE_ENCODER:
    TYPE: swin
    DROP_PATH_RATE: 0.2
    # Options specific to the encoder selected by TYPE above.
    # NOTE(review): SWIN is assumed to be a child of IMAGE_ENCODER — confirm.
    SWIN:
      EMBED_DIM: 96
      # DEPTHS and NUM_HEADS each carry four entries; presumably one per
      # encoder stage, so keep the two lists the same length.
      DEPTHS: [2, 2, 6, 2]
      NUM_HEADS: [3, 6, 12, 24]
      WINDOW_SIZE: 7

  TEXT_ENCODER:
    # Distinct from MODEL.NAME; this key belongs to the text encoder mapping.
    NAME: 'transformer'
    WIDTH: 512
    HEADS: 8
    LAYERS: 12