{ "ee_args": { "desc_input_feature_size": 512, "desc_model_is_bidirectional": true, "desc_output_feature_size": 32, "roomModelArgs": { "out_channels": 128, "scene_in_channels": 512 }, "scenesSequenceModelArgs": { "feature_size": 32, "in_channels": 128, "kernel_size": 3, "out_channels": 64 }, "useLSTM": false }, "strategy_name": "hier_by_room_rnn_meanPoolProc_cnn1d", "transformers_version": "4.34.0", "uses_audio_video_features": null, "uses_flattened_hierarchy": false }