+ echo Logging output to /data_2/output/LM/lcvlm_modellink/scripts/qwen25/finetune_qwen25_14b_intern_300m_ptd_tp8pp1_stage2.sh/20241014_131952//log_node9.txt Logging output to /data_2/output/LM/lcvlm_modellink/scripts/qwen25/finetune_qwen25_14b_intern_300m_ptd_tp8pp1_stage2.sh/20241014_131952//log_node9.txt + export ASCEND_PROCESS_LOG_PATH=/data_2/output/LM/lcvlm_modellink/scripts/qwen25/finetune_qwen25_14b_intern_300m_ptd_tp8pp1_stage2.sh/20241014_131952//ascend/9 + ASCEND_PROCESS_LOG_PATH=/data_2/output/LM/lcvlm_modellink/scripts/qwen25/finetune_qwen25_14b_intern_300m_ptd_tp8pp1_stage2.sh/20241014_131952//ascend/9 + mkdir -p /data_2/output/LM/lcvlm_modellink/scripts/qwen25/finetune_qwen25_14b_intern_300m_ptd_tp8pp1_stage2.sh/20241014_131952//ascend/9 + DATA_PATH=/local_disk/cognitron_vl//configs/lcvlm_finetune_stage2.yaml + TOKENIZER_PATH=/data_4/models/Qwen/Qwen2.5-14B-Instruct/ + CKPT_LOAD_DIR=/data_2/output/LM/lcvlm_modellink/scripts/qwen25/pretrain_qwen25_14b_intern_300m_ptd_tp8pp1_stage1.sh/20241012_095536/ + VIT_CKPT_LOAD_DIR=/ + CKPT_SAVE_DIR=/data_2/output/LM/lcvlm_modellink/scripts/qwen25/finetune_qwen25_14b_intern_300m_ptd_tp8pp1_stage2.sh/20241014_131952// + rsync -avh /local_disk/cognitron_vl//configs/lcvlm_finetune_stage2.yaml /data_2/output/LM/lcvlm_modellink/scripts/qwen25/finetune_qwen25_14b_intern_300m_ptd_tp8pp1_stage2.sh/20241014_131952/ sending incremental file list sent 59 bytes received 12 bytes 142.00 bytes/sec total size is 18.03K speedup is 254.00 + cd /local_disk/cognitron_vl/ + rm -fr datasets + mkdir -p datasets + ln -s /data/data/ datasets/ + source /local_disk/cognitron_vl//scripts/set_env_mg_npu.sh ++ source /usr/local/Ascend/driver/bin/setenv.bash +++ DEP_INFO_FILE=/etc/ascend_install.info +++ [[ -f /etc/ascend_install.info ]] ++ source /usr/local/Ascend/ascend-toolkit/set_env.sh +++ export ASCEND_TOOLKIT_HOME=/usr/local/Ascend/ascend-toolkit/latest +++ ASCEND_TOOLKIT_HOME=/usr/local/Ascend/ascend-toolkit/latest ++++ arch +++ export LD_LIBRARY_PATH=/usr/local/Ascend/ascend-toolkit/latest/lib64:/usr/local/Ascend/ascend-toolkit/latest/lib64/plugin/opskernel:/usr/local/Ascend/ascend-toolkit/latest/lib64/plugin/nnengine:/usr/local/Ascend/ascend-toolkit/latest/opp/built-in/op_impl/ai_core/tbe/op_tiling/lib/linux/x86_64:/usr/local/openmpi/lib:/usr/local/Ascend/driver/lib64/common:/usr/local/Ascend/driver/lib64/driver:/usr/local/Ascend/ascend-toolkit/latest/tools/aml/lib64:/usr/local/Ascend/ascend-toolkit/latest/tools/aml/lib64/plugin:/usr/local/Ascend/ascend-toolkit/latest/lib64:/usr/local/Ascend/ascend-toolkit/latest/lib64/plugin/opskernel:/usr/local/Ascend/ascend-toolkit/latest/lib64/plugin/nnengine:/usr/local/Ascend/ascend-toolkit/latest/opp/built-in/op_impl/ai_core/tbe/op_tiling/lib/linux/x86_64:/usr/local/Ascend/ascend-toolkit/latest/lib64:/usr/local/Ascend/driver/lib64:/usr/local/Ascend/driver/lib64/common:/usr/local/Ascend/driver/lib64/driver:/usr/local/Ascend/driver/tools/hccn_tool/:/opp/built-in/op_impl/ai_core/tbe/op_tiling/lib/linux/x86_64/:/usr/lib/x86_64-linux-gnu/hdf5/serial:/usr/local/python3.7.5/lib: +++ LD_LIBRARY_PATH=/usr/local/Ascend/ascend-toolkit/latest/lib64:/usr/local/Ascend/ascend-toolkit/latest/lib64/plugin/opskernel:/usr/local/Ascend/ascend-toolkit/latest/lib64/plugin/nnengine:/usr/local/Ascend/ascend-toolkit/latest/opp/built-in/op_impl/ai_core/tbe/op_tiling/lib/linux/x86_64:/usr/local/openmpi/lib:/usr/local/Ascend/driver/lib64/common:/usr/local/Ascend/driver/lib64/driver:/usr/local/Ascend/ascend-toolkit/latest/tools/aml/lib64:/usr/local/Ascend/ascend-toolkit/latest/tools/aml/lib64/plugin:/usr/local/Ascend/ascend-toolkit/latest/lib64:/usr/local/Ascend/ascend-toolkit/latest/lib64/plugin/opskernel:/usr/local/Ascend/ascend-toolkit/latest/lib64/plugin/nnengine:/usr/local/Ascend/ascend-toolkit/latest/opp/built-in/op_impl/ai_core/tbe/op_tiling/lib/linux/x86_64:/usr/local/Ascend/ascend-toolkit/latest/lib64:/usr/local/Ascend/driver/lib64:/usr/local/Ascend/driver/lib64/common:/usr/local/Ascend/driver/lib64/driver:/usr/local/Ascend/driver/tools/hccn_tool/:/opp/built-in/op_impl/ai_core/tbe/op_tiling/lib/linux/x86_64/:/usr/lib/x86_64-linux-gnu/hdf5/serial:/usr/local/python3.7.5/lib: +++ export LD_LIBRARY_PATH=/usr/local/Ascend/ascend-toolkit/latest/tools/aml/lib64:/usr/local/Ascend/ascend-toolkit/latest/tools/aml/lib64/plugin:/usr/local/Ascend/ascend-toolkit/latest/lib64:/usr/local/Ascend/ascend-toolkit/latest/lib64/plugin/opskernel:/usr/local/Ascend/ascend-toolkit/latest/lib64/plugin/nnengine:/usr/local/Ascend/ascend-toolkit/latest/opp/built-in/op_impl/ai_core/tbe/op_tiling/lib/linux/x86_64:/usr/local/openmpi/lib:/usr/local/Ascend/driver/lib64/common:/usr/local/Ascend/driver/lib64/driver:/usr/local/Ascend/ascend-toolkit/latest/tools/aml/lib64:/usr/local/Ascend/ascend-toolkit/latest/tools/aml/lib64/plugin:/usr/local/Ascend/ascend-toolkit/latest/lib64:/usr/local/Ascend/ascend-toolkit/latest/lib64/plugin/opskernel:/usr/local/Ascend/ascend-toolkit/latest/lib64/plugin/nnengine:/usr/local/Ascend/ascend-toolkit/latest/opp/built-in/op_impl/ai_core/tbe/op_tiling/lib/linux/x86_64:/usr/local/Ascend/ascend-toolkit/latest/lib64:/usr/local/Ascend/driver/lib64:/usr/local/Ascend/driver/lib64/common:/usr/local/Ascend/driver/lib64/driver:/usr/local/Ascend/driver/tools/hccn_tool/:/opp/built-in/op_impl/ai_core/tbe/op_tiling/lib/linux/x86_64/:/usr/lib/x86_64-linux-gnu/hdf5/serial:/usr/local/python3.7.5/lib: +++ LD_LIBRARY_PATH=/usr/local/Ascend/ascend-toolkit/latest/tools/aml/lib64:/usr/local/Ascend/ascend-toolkit/latest/tools/aml/lib64/plugin:/usr/local/Ascend/ascend-toolkit/latest/lib64:/usr/local/Ascend/ascend-toolkit/latest/lib64/plugin/opskernel:/usr/local/Ascend/ascend-toolkit/latest/lib64/plugin/nnengine:/usr/local/Ascend/ascend-toolkit/latest/opp/built-in/op_impl/ai_core/tbe/op_tiling/lib/linux/x86_64:/usr/local/openmpi/lib:/usr/local/Ascend/driver/lib64/common:/usr/local/Ascend/driver/lib64/driver:/usr/local/Ascend/ascend-toolkit/latest/tools/aml/lib64:/usr/local/Ascend/ascend-toolkit/latest/tools/aml/lib64/plugin:/usr/local/Ascend/ascend-toolkit/latest/lib64:/usr/local/Ascend/ascend-toolkit/latest/lib64/plugin/opskernel:/usr/local/Ascend/ascend-toolkit/latest/lib64/plugin/nnengine:/usr/local/Ascend/ascend-toolkit/latest/opp/built-in/op_impl/ai_core/tbe/op_tiling/lib/linux/x86_64:/usr/local/Ascend/ascend-toolkit/latest/lib64:/usr/local/Ascend/driver/lib64:/usr/local/Ascend/driver/lib64/common:/usr/local/Ascend/driver/lib64/driver:/usr/local/Ascend/driver/tools/hccn_tool/:/opp/built-in/op_impl/ai_core/tbe/op_tiling/lib/linux/x86_64/:/usr/lib/x86_64-linux-gnu/hdf5/serial:/usr/local/python3.7.5/lib: +++ export PYTHONPATH=/usr/local/Ascend/ascend-toolkit/latest/python/site-packages:/usr/local/Ascend/ascend-toolkit/latest/opp/built-in/op_impl/ai_core/tbe:/usr/local/Ascend/ascend-toolkit/latest/python/site-packages:/usr/local/Ascend/ascend-toolkit/latest/opp/built-in/op_impl/ai_core/tbe:/usr/local/Ascend/ascend-toolkit/latest/opp/op_impl/built-in/ai_core/tbe: +++ PYTHONPATH=/usr/local/Ascend/ascend-toolkit/latest/python/site-packages:/usr/local/Ascend/ascend-toolkit/latest/opp/built-in/op_impl/ai_core/tbe:/usr/local/Ascend/ascend-toolkit/latest/python/site-packages:/usr/local/Ascend/ascend-toolkit/latest/opp/built-in/op_impl/ai_core/tbe:/usr/local/Ascend/ascend-toolkit/latest/opp/op_impl/built-in/ai_core/tbe: +++ export PATH=/usr/local/Ascend/ascend-toolkit/latest/bin:/usr/local/Ascend/ascend-toolkit/latest/compiler/ccec_compiler/bin:/usr/local/Ascend/ascend-toolkit/latest/tools/ccec_compiler/bin:/usr/local/openmpi/bin:/usr/local/Ascend/driver/tools:/usr/local/Ascend/ascend-toolkit/latest/bin:/usr/local/Ascend/ascend-toolkit/latest/compiler/ccec_compiler/bin:/usr/local/Ascend/ascend-toolkit/latest/tools/ccec_compiler/bin:/root/miniconda3/envs/torch21_python38/bin:/root/miniconda3/condabin:/usr/local/Ascend/ascend-toolkit/latest/ccec_compiler/bin:/usr/local/python3.7.5/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin +++ PATH=/usr/local/Ascend/ascend-toolkit/latest/bin:/usr/local/Ascend/ascend-toolkit/latest/compiler/ccec_compiler/bin:/usr/local/Ascend/ascend-toolkit/latest/tools/ccec_compiler/bin:/usr/local/openmpi/bin:/usr/local/Ascend/driver/tools:/usr/local/Ascend/ascend-toolkit/latest/bin:/usr/local/Ascend/ascend-toolkit/latest/compiler/ccec_compiler/bin:/usr/local/Ascend/ascend-toolkit/latest/tools/ccec_compiler/bin:/root/miniconda3/envs/torch21_python38/bin:/root/miniconda3/condabin:/usr/local/Ascend/ascend-toolkit/latest/ccec_compiler/bin:/usr/local/python3.7.5/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin +++ export ASCEND_AICPU_PATH=/usr/local/Ascend/ascend-toolkit/latest +++ ASCEND_AICPU_PATH=/usr/local/Ascend/ascend-toolkit/latest +++ export ASCEND_OPP_PATH=/usr/local/Ascend/ascend-toolkit/latest/opp +++ ASCEND_OPP_PATH=/usr/local/Ascend/ascend-toolkit/latest/opp +++ export TOOLCHAIN_HOME=/usr/local/Ascend/ascend-toolkit/latest/toolkit +++ TOOLCHAIN_HOME=/usr/local/Ascend/ascend-toolkit/latest/toolkit +++ export ASCEND_HOME_PATH=/usr/local/Ascend/ascend-toolkit/latest +++ ASCEND_HOME_PATH=/usr/local/Ascend/ascend-toolkit/latest ++ export HCCL_CONNECT_TIMEOUT=7200 ++ HCCL_CONNECT_TIMEOUT=7200 ++ export HCCL_EXEC_TIMEOUT=7200 ++ HCCL_EXEC_TIMEOUT=7200 ++ export COMBINED_ENABLE=1 ++ COMBINED_ENABLE=1 ++ export MULTI_STREAM_MEMORY_REUSE=1 ++ MULTI_STREAM_MEMORY_REUSE=1 ++ export HCCL_RDMA_TC=160 ++ HCCL_RDMA_TC=160 ++ export HCCL_RDMA_SL=5 ++ HCCL_RDMA_SL=5 ++ export HCCL_INTRA_PCIE_ENABLE=0 ++ HCCL_INTRA_PCIE_ENABLE=0 ++ export HCCL_INTRA_ROCE_ENABLE=1 ++ HCCL_INTRA_ROCE_ENABLE=1 ++ export HCCL_RDMA_TIMEOUT=20 ++ HCCL_RDMA_TIMEOUT=20 ++ export INF_NAN_MODE_ENABLE=1 ++ INF_NAN_MODE_ENABLE=1 ++ export DISTRIBUTED_BACKEND=hccl ++ DISTRIBUTED_BACKEND=hccl ++ export ASCEND_LAUNCH_BLOCKING=0 ++ ASCEND_LAUNCH_BLOCKING=0 ++ export ASCEND_SLOG_PRINT_TO_STDOUT=0 ++ ASCEND_SLOG_PRINT_TO_STDOUT=0 ++ export ASCEND_GLOBAL_LOG_LEVEL=3 ++ ASCEND_GLOBAL_LOG_LEVEL=3 ++ export ASCEND_GLOBAL_EVENT_ENABLE=0 ++ ASCEND_GLOBAL_EVENT_ENABLE=0 ++ export TASK_QUEUE_ENABLE=1 ++ TASK_QUEUE_ENABLE=1 ++ export PTCOPY_ENABLE=1 ++ PTCOPY_ENABLE=1 ++ export COMBINED_ENABLE=1 ++ COMBINED_ENABLE=1 ++ export DYNAMIC_OP=ADD#MUL ++ DYNAMIC_OP=ADD#MUL ++ export HCCL_WHITELIST_DISABLE=1 ++ HCCL_WHITELIST_DISABLE=1 ++ export HCCL_CONNECT_TIMEOUT=7200 ++ HCCL_CONNECT_TIMEOUT=7200 ++ export HCCL_WHITELIST_DISABLE=1 ++ HCCL_WHITELIST_DISABLE=1 ++ export CUDA_DEVICE_MAX_CONNECTIONS=1 ++ CUDA_DEVICE_MAX_CONNECTIONS=1 ++ rm -fr /usr/local/python3.7.5/bin/ ++ apt-get install -y libaio-dev Reading package lists... Building dependency tree... Reading state information... The following additional packages will be installed: libaio1 The following NEW packages will be installed: libaio-dev libaio1 0 upgraded, 2 newly installed, 0 to remove and 55 not upgraded. Need to get 19.3 kB of archives. After this operation, 87.0 kB of additional disk space will be used. Get:1 http://mirrors.tencentyun.com/ubuntu bionic-updates/main amd64 libaio1 amd64 0.3.110-5ubuntu0.1 [6,476 B] Get:2 http://mirrors.tencentyun.com/ubuntu bionic-updates/main amd64 libaio-dev amd64 0.3.110-5ubuntu0.1 [12.8 kB] debconf: delaying package configuration, since apt-utils is not installed Fetched 19.3 kB in 0s (670 kB/s) Selecting previously unselected package libaio1:amd64. (Reading database ... (Reading database ... 5% (Reading database ... 10% (Reading database ... 15% (Reading database ... 20% (Reading database ... 25% (Reading database ... 30% (Reading database ... 35% (Reading database ... 40% (Reading database ... 45% (Reading database ... 50% (Reading database ... 55% (Reading database ... 60% (Reading database ... 65% (Reading database ... 70% (Reading database ... 75% (Reading database ... 80% (Reading database ... 85% (Reading database ... 90% (Reading database ... 95% (Reading database ... 100% (Reading database ... 21494 files and directories currently installed.) Preparing to unpack .../libaio1_0.3.110-5ubuntu0.1_amd64.deb ... Unpacking libaio1:amd64 (0.3.110-5ubuntu0.1) ... Selecting previously unselected package libaio-dev:amd64. Preparing to unpack .../libaio-dev_0.3.110-5ubuntu0.1_amd64.deb ... Unpacking libaio-dev:amd64 (0.3.110-5ubuntu0.1) ... Processing triggers for libc-bin (2.27-3ubuntu1) ... /sbin/ldconfig.real: File /usr/lib/x86_64-linux-gnu/libnvidia-cfg.so.1 is empty, not checked. /sbin/ldconfig.real: File /usr/lib/x86_64-linux-gnu/libcudadebugger.so.1 is empty, not checked. /sbin/ldconfig.real: File /usr/lib/x86_64-linux-gnu/libnvidia-ptxjitcompiler.so.1 is empty, not checked. /sbin/ldconfig.real: File /usr/lib/x86_64-linux-gnu/libcuda.so is empty, not checked. /sbin/ldconfig.real: File /usr/lib/x86_64-linux-gnu/libcuda.so.535.54.04 is empty, not checked. /sbin/ldconfig.real: File /usr/lib/x86_64-linux-gnu/libnvidia-allocator.so.1 is empty, not checked. /sbin/ldconfig.real: File /usr/lib/x86_64-linux-gnu/libnvidia-cfg.so.535.54.04 is empty, not checked. /sbin/ldconfig.real: File /usr/lib/x86_64-linux-gnu/libnvidia-pkcs11.so.535.54.04 is empty, not checked. /sbin/ldconfig.real: File /usr/lib/x86_64-linux-gnu/libnvidia-opencl.so.1 is empty, not checked. /sbin/ldconfig.real: File /usr/lib/x86_64-linux-gnu/libnvidia-ml.so.535.54.04 is empty, not checked. /sbin/ldconfig.real: File /usr/lib/x86_64-linux-gnu/libnvidia-ml.so.1 is empty, not checked. /sbin/ldconfig.real: File /usr/lib/x86_64-linux-gnu/libcudadebugger.so.535.54.04 is empty, not checked. /sbin/ldconfig.real: File /usr/lib/x86_64-linux-gnu/libnvidia-ptxjitcompiler.so.535.54.04 is empty, not checked. /sbin/ldconfig.real: File /usr/lib/x86_64-linux-gnu/libcuda.so.1 is empty, not checked. /sbin/ldconfig.real: File /usr/lib/x86_64-linux-gnu/libnvidia-opencl.so.535.54.04 is empty, not checked. /sbin/ldconfig.real: File /usr/lib/x86_64-linux-gnu/libnvidia-allocator.so.535.54.04 is empty, not checked. /sbin/ldconfig.real: File /usr/lib/x86_64-linux-gnu/libnvidia-ptxjitcompiler.so.515.65.01 is empty, not checked. /sbin/ldconfig.real: File /usr/lib/x86_64-linux-gnu/libnvidia-opencl.so.515.65.01 is empty, not checked. /sbin/ldconfig.real: File /usr/lib/x86_64-linux-gnu/libnvidia-cfg.so.515.65.01 is empty, not checked. /sbin/ldconfig.real: File /usr/lib/x86_64-linux-gnu/libnvidia-ml.so.515.65.01 is empty, not checked. /sbin/ldconfig.real: File /usr/lib/x86_64-linux-gnu/libnvidia-nvvm.so.515.65.01 is empty, not checked. /sbin/ldconfig.real: File /usr/lib/x86_64-linux-gnu/libnvidia-nvvm.so.4 is empty, not checked. /sbin/ldconfig.real: File /usr/lib/x86_64-linux-gnu/libnvidia-compiler.so.515.65.01 is empty, not checked. /sbin/ldconfig.real: File /usr/lib/x86_64-linux-gnu/libnvidia-allocator.so.515.65.01 is empty, not checked. /sbin/ldconfig.real: File /usr/lib/x86_64-linux-gnu/libcuda.so.515.65.01 is empty, not checked. Setting up libaio1:amd64 (0.3.110-5ubuntu0.1) ... Setting up libaio-dev:amd64 (0.3.110-5ubuntu0.1) ... Processing triggers for libc-bin (2.27-3ubuntu1) ... /sbin/ldconfig.real: File /usr/lib/x86_64-linux-gnu/libnvidia-cfg.so.1 is empty, not checked. /sbin/ldconfig.real: File /usr/lib/x86_64-linux-gnu/libcudadebugger.so.1 is empty, not checked. /sbin/ldconfig.real: File /usr/lib/x86_64-linux-gnu/libnvidia-ptxjitcompiler.so.1 is empty, not checked. /sbin/ldconfig.real: File /usr/lib/x86_64-linux-gnu/libcuda.so is empty, not checked. /sbin/ldconfig.real: File /usr/lib/x86_64-linux-gnu/libcuda.so.535.54.04 is empty, not checked. /sbin/ldconfig.real: File /usr/lib/x86_64-linux-gnu/libnvidia-allocator.so.1 is empty, not checked. /sbin/ldconfig.real: File /usr/lib/x86_64-linux-gnu/libnvidia-cfg.so.535.54.04 is empty, not checked. /sbin/ldconfig.real: File /usr/lib/x86_64-linux-gnu/libnvidia-pkcs11.so.535.54.04 is empty, not checked. /sbin/ldconfig.real: File /usr/lib/x86_64-linux-gnu/libnvidia-opencl.so.1 is empty, not checked. /sbin/ldconfig.real: File /usr/lib/x86_64-linux-gnu/libnvidia-ml.so.535.54.04 is empty, not checked. /sbin/ldconfig.real: File /usr/lib/x86_64-linux-gnu/libnvidia-ml.so.1 is empty, not checked. /sbin/ldconfig.real: File /usr/lib/x86_64-linux-gnu/libcudadebugger.so.535.54.04 is empty, not checked. /sbin/ldconfig.real: File /usr/lib/x86_64-linux-gnu/libnvidia-ptxjitcompiler.so.535.54.04 is empty, not checked. /sbin/ldconfig.real: File /usr/lib/x86_64-linux-gnu/libcuda.so.1 is empty, not checked. /sbin/ldconfig.real: File /usr/lib/x86_64-linux-gnu/libnvidia-opencl.so.535.54.04 is empty, not checked. /sbin/ldconfig.real: File /usr/lib/x86_64-linux-gnu/libnvidia-allocator.so.535.54.04 is empty, not checked. /sbin/ldconfig.real: File /usr/lib/x86_64-linux-gnu/libnvidia-ptxjitcompiler.so.515.65.01 is empty, not checked. /sbin/ldconfig.real: File /usr/lib/x86_64-linux-gnu/libnvidia-opencl.so.515.65.01 is empty, not checked. /sbin/ldconfig.real: File /usr/lib/x86_64-linux-gnu/libnvidia-cfg.so.515.65.01 is empty, not checked. /sbin/ldconfig.real: File /usr/lib/x86_64-linux-gnu/libnvidia-ml.so.515.65.01 is empty, not checked. /sbin/ldconfig.real: File /usr/lib/x86_64-linux-gnu/libnvidia-nvvm.so.515.65.01 is empty, not checked. /sbin/ldconfig.real: File /usr/lib/x86_64-linux-gnu/libnvidia-nvvm.so.4 is empty, not checked. /sbin/ldconfig.real: File /usr/lib/x86_64-linux-gnu/libnvidia-compiler.so.515.65.01 is empty, not checked. /sbin/ldconfig.real: File /usr/lib/x86_64-linux-gnu/libnvidia-allocator.so.515.65.01 is empty, not checked. /sbin/ldconfig.real: File /usr/lib/x86_64-linux-gnu/libcuda.so.515.65.01 is empty, not checked. ++ apt-get install -y python3-pybind11 Reading package lists... Building dependency tree... Reading state information... The following additional packages will be installed: pybind11-dev Suggested packages: libeigen3-dev pybind11-doc The following NEW packages will be installed: pybind11-dev python3-pybind11 0 upgraded, 2 newly installed, 0 to remove and 55 not upgraded. Need to get 77.4 kB of archives. After this operation, 427 kB of additional disk space will be used. Get:1 http://mirrors.tencentyun.com/ubuntu bionic/universe amd64 pybind11-dev all 2.0.1-4 [72.8 kB] Get:2 http://mirrors.tencentyun.com/ubuntu bionic/universe amd64 python3-pybind11 all 2.0.1-4 [4,652 B] debconf: delaying package configuration, since apt-utils is not installed Fetched 77.4 kB in 0s (2,575 kB/s) Selecting previously unselected package pybind11-dev. (Reading database ... (Reading database ... 5% (Reading database ... 10% (Reading database ... 15% (Reading database ... 20% (Reading database ... 25% (Reading database ... 30% (Reading database ... 35% (Reading database ... 40% (Reading database ... 45% (Reading database ... 50% (Reading database ... 55% (Reading database ... 60% (Reading database ... 65% (Reading database ... 70% (Reading database ... 75% (Reading database ... 80% (Reading database ... 85% (Reading database ... 90% (Reading database ... 95% (Reading database ... 100% (Reading database ... 21517 files and directories currently installed.) Preparing to unpack .../pybind11-dev_2.0.1-4_all.deb ... Unpacking pybind11-dev (2.0.1-4) ... Selecting previously unselected package python3-pybind11. Preparing to unpack .../python3-pybind11_2.0.1-4_all.deb ... Unpacking python3-pybind11 (2.0.1-4) ... Setting up pybind11-dev (2.0.1-4) ... Setting up python3-pybind11 (2.0.1-4) ... ++ apt-get install -y python3-dev Reading package lists... Building dependency tree... Reading state information... The following additional packages will be installed: dh-python libexpat1-dev libpython3-dev libpython3.6-dev python3-distutils python3-lib2to3 python3.6-dev The following NEW packages will be installed: dh-python libexpat1-dev libpython3-dev libpython3.6-dev python3-dev python3-distutils python3-lib2to3 python3.6-dev 0 upgraded, 8 newly installed, 0 to remove and 55 not upgraded. Need to get 45.8 MB of archives. After this operation, 81.5 MB of additional disk space will be used. Get:1 http://mirrors.tencentyun.com/ubuntu bionic-updates/main amd64 python3-lib2to3 all 3.6.9-1~18.04 [77.4 kB] Get:2 http://mirrors.tencentyun.com/ubuntu bionic-updates/main amd64 python3-distutils all 3.6.9-1~18.04 [144 kB] Get:3 http://mirrors.tencentyun.com/ubuntu bionic/main amd64 dh-python all 3.20180325ubuntu2 [89.2 kB] Get:4 http://mirrors.tencentyun.com/ubuntu bionic-updates/main amd64 libexpat1-dev amd64 2.2.5-3ubuntu0.9 [124 kB] Get:5 http://mirrors.tencentyun.com/ubuntu bionic-updates/main amd64 libpython3.6-dev amd64 3.6.9-1~18.04ubuntu1.12 [44.9 MB] Get:6 http://mirrors.tencentyun.com/ubuntu bionic-updates/main amd64 libpython3-dev amd64 3.6.7-1~18.04 [7,328 B] Get:7 http://mirrors.tencentyun.com/ubuntu bionic-updates/main amd64 python3.6-dev amd64 3.6.9-1~18.04ubuntu1.12 [511 kB] Get:8 http://mirrors.tencentyun.com/ubuntu bionic-updates/main amd64 python3-dev amd64 3.6.7-1~18.04 [1,288 B] debconf: delaying package configuration, since apt-utils is not installed Fetched 45.8 MB in 1s (70.1 MB/s) Selecting previously unselected package python3-lib2to3. (Reading database ... (Reading database ... 5% (Reading database ... 10% (Reading database ... 15% (Reading database ... 20% (Reading database ... 25% (Reading database ... 30% (Reading database ... 35% (Reading database ... 40% (Reading database ... 45% (Reading database ... 50% (Reading database ... 55% (Reading database ... 60% (Reading database ... 65% (Reading database ... 70% (Reading database ... 75% (Reading database ... 80% (Reading database ... 85% (Reading database ... 90% (Reading database ... 95% (Reading database ... 100% (Reading database ... 21555 files and directories currently installed.) Preparing to unpack .../0-python3-lib2to3_3.6.9-1~18.04_all.deb ... Unpacking python3-lib2to3 (3.6.9-1~18.04) ... Selecting previously unselected package python3-distutils. Preparing to unpack .../1-python3-distutils_3.6.9-1~18.04_all.deb ... Unpacking python3-distutils (3.6.9-1~18.04) ... Selecting previously unselected package dh-python. Preparing to unpack .../2-dh-python_3.20180325ubuntu2_all.deb ... Unpacking dh-python (3.20180325ubuntu2) ... Selecting previously unselected package libexpat1-dev:amd64. Preparing to unpack .../3-libexpat1-dev_2.2.5-3ubuntu0.9_amd64.deb ... Unpacking libexpat1-dev:amd64 (2.2.5-3ubuntu0.9) ... Selecting previously unselected package libpython3.6-dev:amd64. Preparing to unpack .../4-libpython3.6-dev_3.6.9-1~18.04ubuntu1.12_amd64.deb ... Unpacking libpython3.6-dev:amd64 (3.6.9-1~18.04ubuntu1.12) ... Selecting previously unselected package libpython3-dev:amd64. Preparing to unpack .../5-libpython3-dev_3.6.7-1~18.04_amd64.deb ... Unpacking libpython3-dev:amd64 (3.6.7-1~18.04) ... Selecting previously unselected package python3.6-dev. Preparing to unpack .../6-python3.6-dev_3.6.9-1~18.04ubuntu1.12_amd64.deb ... Unpacking python3.6-dev (3.6.9-1~18.04ubuntu1.12) ... Selecting previously unselected package python3-dev. Preparing to unpack .../7-python3-dev_3.6.7-1~18.04_amd64.deb ... Unpacking python3-dev (3.6.7-1~18.04) ... Setting up libexpat1-dev:amd64 (2.2.5-3ubuntu0.9) ... Setting up python3-lib2to3 (3.6.9-1~18.04) ... Setting up python3-distutils (3.6.9-1~18.04) ... Setting up libpython3.6-dev:amd64 (3.6.9-1~18.04ubuntu1.12) ... Setting up python3.6-dev (3.6.9-1~18.04ubuntu1.12) ... Setting up dh-python (3.20180325ubuntu2) ... Setting up libpython3-dev:amd64 (3.6.7-1~18.04) ... Setting up python3-dev (3.6.7-1~18.04) ... ++ '[' -f /usr/local/bin/python3.9 ']' ++ pip3 uninstall -y deepspeed_npu WARNING: Skipping deepspeed_npu as it is not installed. WARNING: Running pip as the 'root' user can result in broken permissions and conflicting behaviour with the system package manager. It is recommended to use a virtual environment instead: https://pip.pypa.io/warnings/venv ++ pip3 uninstall -y deepspeed Found existing installation: deepspeed 0.9.2 Uninstalling deepspeed-0.9.2: Successfully uninstalled deepspeed-0.9.2 WARNING: Running pip as the 'root' user can result in broken permissions and conflicting behaviour with the system package manager. It is recommended to use a virtual environment instead: https://pip.pypa.io/warnings/venv ++ pip3 uninstall -y torch_npu WARNING: Skipping torch_npu as it is not installed. WARNING: Running pip as the 'root' user can result in broken permissions and conflicting behaviour with the system package manager. It is recommended to use a virtual environment instead: https://pip.pypa.io/warnings/venv ++ pip3 uninstall -y torch Found existing installation: torch 2.1.0+cpu Uninstalling torch-2.1.0+cpu: Successfully uninstalled torch-2.1.0+cpu WARNING: Running pip as the 'root' user can result in broken permissions and conflicting behaviour with the system package manager. It is recommended to use a virtual environment instead: https://pip.pypa.io/warnings/venv ++ pip3 install --no-index --find-links=/data/software/ torch==2.1.0 torchvision==0.16.0 torch_npu==2.1.0.post6 Looking in links: /data/software/ Processing data/software/torch-2.1.0+cpu-cp38-cp38-linux_x86_64.whl Requirement already satisfied: torchvision==0.16.0 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (0.16.0) Processing data/software/torch_npu-2.1.0.post6-cp38-cp38-manylinux_2_17_x86_64.manylinux2014_x86_64.whl Requirement already satisfied: filelock in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from torch==2.1.0) (3.13.1) Requirement already satisfied: typing-extensions in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from torch==2.1.0) (4.9.0) Requirement already satisfied: sympy in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from torch==2.1.0) (1.12) Requirement already satisfied: networkx in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from torch==2.1.0) (3.1) Requirement already satisfied: jinja2 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from torch==2.1.0) (3.1.2) Requirement already satisfied: fsspec in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from torch==2.1.0) (2023.10.0) Requirement already satisfied: numpy in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from torchvision==0.16.0) (1.24.4) Requirement already satisfied: requests in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from torchvision==0.16.0) (2.31.0) Requirement already satisfied: pillow!=8.3.*,>=5.3.0 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from torchvision==0.16.0) (10.2.0) Requirement already satisfied: MarkupSafe>=2.0 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from jinja2->torch==2.1.0) (2.1.3) Requirement already satisfied: charset-normalizer<4,>=2 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from requests->torchvision==0.16.0) (3.3.2) Requirement already satisfied: idna<4,>=2.5 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from requests->torchvision==0.16.0) (3.6) Requirement already satisfied: urllib3<3,>=1.21.1 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from requests->torchvision==0.16.0) (2.1.0) Requirement already satisfied: certifi>=2017.4.17 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from requests->torchvision==0.16.0) (2023.11.17) Requirement already satisfied: mpmath>=0.19 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from sympy->torch==2.1.0) (1.3.0) DEPRECATION: apex 0.1-ascend-20231124 has a non-standard version number. pip 24.0 will enforce this behaviour change. A possible replacement is to upgrade to a newer version of apex or contact the author to suggest that they release a version with a conforming version number. Discussion can be found at https://github.com/pypa/pip/issues/12063 Installing collected packages: torch, torch_npu Successfully installed torch-2.1.0+cpu torch_npu-2.1.0.post6 WARNING: Running pip as the 'root' user can result in broken permissions and conflicting behaviour with the system package manager. It is recommended to use a virtual environment instead: https://pip.pypa.io/warnings/venv ++ pip3 install --no-index --find-links=/data/software/ -r requirements.txt Looking in links: /data/software/ Requirement already satisfied: expecttest in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from -r requirements.txt (line 1)) (0.2.1) Requirement already satisfied: peft in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from -r requirements.txt (line 2)) (0.5.0) Processing data/software/XlsxWriter-3.2.0-py3-none-any.whl (from -r requirements.txt (line 3)) Processing data/software/termcolor-2.4.0-py3-none-any.whl (from -r requirements.txt (line 4)) Processing data/software/tabulate-0.9.0-py3-none-any.whl (from -r requirements.txt (line 5)) Requirement already satisfied: tiktoken in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from -r requirements.txt (line 6)) (0.5.2) Requirement already satisfied: matplotlib in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from -r requirements.txt (line 7)) (3.7.4) Processing data/software/datasets-2.21.0-py3-none-any.whl (from -r requirements.txt (line 8)) Requirement already satisfied: einops in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from -r requirements.txt (line 9)) (0.6.1) Requirement already satisfied: pybind11 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from -r requirements.txt (line 10)) (2.11.1) Requirement already satisfied: tensorboardX in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from -r requirements.txt (line 11)) (2.6.2.2) Processing data/software/pyarrow-16.1.0-cp38-cp38-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (from -r requirements.txt (line 12)) Processing data/software/transformers-4.40.1-py3-none-any.whl (from -r requirements.txt (line 13)) Processing data/software/deepspeed-0.14.2.tar.gz (from -r requirements.txt (line 14)) Preparing metadata (setup.py): started Preparing metadata (setup.py): finished with status 'done' Processing data/software/accelerate-0.29.3-py3-none-any.whl (from -r requirements.txt (line 15)) Processing data/software/timm-1.0.7-py3-none-any.whl (from -r requirements.txt (line 16)) Processing data/software/flask-3.0.3-py3-none-any.whl (from -r requirements.txt (line 17)) Processing data/software/Flask_RESTful-0.3.10-py2.py3-none-any.whl (from -r requirements.txt (line 18)) Processing data/software/decord-0.6.0-py3-none-manylinux2010_x86_64.whl (from -r requirements.txt (line 19)) Processing data/software/natsort-8.4.0-py3-none-any.whl (from -r requirements.txt (line 20)) Requirement already satisfied: filelock in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from datasets==2.21.0->-r requirements.txt (line 8)) (3.13.1) Requirement already satisfied: numpy>=1.17 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from datasets==2.21.0->-r requirements.txt (line 8)) (1.24.4) Requirement already satisfied: dill<0.3.9,>=0.3.0 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from datasets==2.21.0->-r requirements.txt (line 8)) (0.3.7) Requirement already satisfied: pandas in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from datasets==2.21.0->-r requirements.txt (line 8)) (2.0.3) Processing data/software/requests-2.32.3-py3-none-any.whl (from datasets==2.21.0->-r requirements.txt (line 8)) Processing data/software/tqdm-4.66.5-py3-none-any.whl (from datasets==2.21.0->-r requirements.txt (line 8)) Requirement already satisfied: xxhash in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from datasets==2.21.0->-r requirements.txt (line 8)) (3.4.1) Requirement already satisfied: multiprocess in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from datasets==2.21.0->-r requirements.txt (line 8)) (0.70.15) Requirement already satisfied: fsspec<=2024.6.1,>=2023.1.0 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from fsspec[http]<=2024.6.1,>=2023.1.0->datasets==2.21.0->-r requirements.txt (line 8)) (2023.10.0) Requirement already satisfied: aiohttp in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from datasets==2.21.0->-r requirements.txt (line 8)) (3.9.1) Processing data/software/huggingface_hub-0.25.2-py3-none-any.whl (from datasets==2.21.0->-r requirements.txt (line 8)) Requirement already satisfied: packaging in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from datasets==2.21.0->-r requirements.txt (line 8)) (23.2) Requirement already satisfied: pyyaml>=5.1 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from datasets==2.21.0->-r requirements.txt (line 8)) (6.0.1) Requirement already satisfied: regex!=2019.12.17 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from transformers==4.40.1->-r requirements.txt (line 13)) (2023.12.25) Processing data/software/tokenizers-0.19.1-cp38-cp38-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (from transformers==4.40.1->-r requirements.txt (line 13)) Requirement already satisfied: safetensors>=0.4.1 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from transformers==4.40.1->-r requirements.txt (line 13)) (0.4.1) Requirement already satisfied: hjson in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from deepspeed==0.14.2->-r requirements.txt (line 14)) (3.1.0) Requirement already satisfied: ninja in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from deepspeed==0.14.2->-r requirements.txt (line 14)) (1.11.1.1) Requirement already satisfied: psutil in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from deepspeed==0.14.2->-r requirements.txt (line 14)) (5.9.7) Requirement already satisfied: py-cpuinfo in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from deepspeed==0.14.2->-r requirements.txt (line 14)) (9.0.0) Requirement already satisfied: pydantic in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from deepspeed==0.14.2->-r requirements.txt (line 14)) (1.10.13) Processing data/software/pynvml-11.5.0-py3-none-any.whl (from deepspeed==0.14.2->-r requirements.txt (line 14)) Requirement already satisfied: torch in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from deepspeed==0.14.2->-r requirements.txt (line 14)) (2.1.0+cpu) Requirement already satisfied: contourpy>=1.0.1 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from matplotlib->-r requirements.txt (line 7)) (1.1.1) Requirement already satisfied: cycler>=0.10 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from matplotlib->-r requirements.txt (line 7)) (0.12.1) Requirement already satisfied: fonttools>=4.22.0 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from matplotlib->-r requirements.txt (line 7)) (4.47.2) Requirement already satisfied: kiwisolver>=1.0.1 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from matplotlib->-r requirements.txt (line 7)) (1.4.5) Requirement already satisfied: pillow>=6.2.0 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from matplotlib->-r requirements.txt (line 7)) (10.2.0) Requirement already satisfied: pyparsing>=2.3.1 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from matplotlib->-r requirements.txt (line 7)) (3.1.1) Requirement already satisfied: python-dateutil>=2.7 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from matplotlib->-r requirements.txt (line 7)) (2.8.2) Requirement already satisfied: importlib-resources>=3.2.0 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from matplotlib->-r requirements.txt (line 7)) (6.1.1) Requirement already satisfied: protobuf>=3.20 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from tensorboardX->-r requirements.txt (line 11)) (3.20.3) Requirement already satisfied: torchvision in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from timm->-r requirements.txt (line 16)) (0.16.0) Requirement already satisfied: Werkzeug>=3.0.0 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from flask->-r requirements.txt (line 17)) (3.0.1) Requirement already satisfied: Jinja2>=3.1.2 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from flask->-r requirements.txt (line 17)) (3.1.2) Processing data/software/itsdangerous-2.2.0-py3-none-any.whl (from flask->-r requirements.txt (line 17)) Requirement already satisfied: click>=8.1.3 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from flask->-r requirements.txt (line 17)) (8.1.7) Processing data/software/blinker-1.8.2-py3-none-any.whl (from flask->-r requirements.txt (line 17)) Requirement already satisfied: importlib-metadata>=3.6.0 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from flask->-r requirements.txt (line 17)) (7.0.1) Processing data/software/aniso8601-9.0.1-py2.py3-none-any.whl (from flask_restful->-r requirements.txt (line 18)) Requirement already satisfied: six>=1.3.0 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from flask_restful->-r requirements.txt (line 18)) (1.16.0) Requirement already satisfied: pytz in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from flask_restful->-r requirements.txt (line 18)) (2023.3.post1) Requirement already satisfied: attrs>=17.3.0 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from aiohttp->datasets==2.21.0->-r requirements.txt (line 8)) (23.2.0) Requirement already satisfied: multidict<7.0,>=4.5 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from aiohttp->datasets==2.21.0->-r requirements.txt (line 8)) (6.0.4) Requirement already satisfied: yarl<2.0,>=1.0 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from aiohttp->datasets==2.21.0->-r requirements.txt (line 8)) (1.9.4) Requirement already satisfied: frozenlist>=1.1.1 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from aiohttp->datasets==2.21.0->-r requirements.txt (line 8)) (1.4.1) Requirement already satisfied: aiosignal>=1.1.2 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from aiohttp->datasets==2.21.0->-r requirements.txt (line 8)) (1.3.1) Requirement already satisfied: async-timeout<5.0,>=4.0 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from aiohttp->datasets==2.21.0->-r requirements.txt (line 8)) (4.0.3) Requirement already satisfied: typing-extensions>=3.7.4.3 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from huggingface-hub>=0.21.2->datasets==2.21.0->-r requirements.txt (line 8)) (4.9.0) Requirement already satisfied: zipp>=0.5 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from importlib-metadata>=3.6.0->flask->-r requirements.txt (line 17)) (3.17.0) Requirement already satisfied: MarkupSafe>=2.0 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from Jinja2>=3.1.2->flask->-r requirements.txt (line 17)) (2.1.3) Requirement already satisfied: charset-normalizer<4,>=2 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from requests>=2.32.2->datasets==2.21.0->-r requirements.txt (line 8)) (3.3.2) Requirement already satisfied: idna<4,>=2.5 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from requests>=2.32.2->datasets==2.21.0->-r requirements.txt (line 8)) (3.6) Requirement already satisfied: urllib3<3,>=1.21.1 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from requests>=2.32.2->datasets==2.21.0->-r requirements.txt (line 8)) (2.1.0) Requirement already satisfied: certifi>=2017.4.17 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from requests>=2.32.2->datasets==2.21.0->-r requirements.txt (line 8)) (2023.11.17) Requirement already satisfied: sympy in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from torch->deepspeed==0.14.2->-r requirements.txt (line 14)) (1.12) Requirement already satisfied: networkx in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from torch->deepspeed==0.14.2->-r requirements.txt (line 14)) (3.1) Requirement already satisfied: tzdata>=2022.1 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from pandas->datasets==2.21.0->-r requirements.txt (line 8)) (2023.4) Requirement already satisfied: mpmath>=0.19 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from sympy->torch->deepspeed==0.14.2->-r requirements.txt (line 14)) (1.3.0) Building wheels for collected packages: deepspeed Building wheel for deepspeed (setup.py): started Building wheel for deepspeed (setup.py): finished with status 'done' Created wheel for deepspeed: filename=deepspeed-0.14.2-py3-none-any.whl size=1432137 sha256=e7fe43d9cecd7486b20a0b8de522fd4d16f4653e87258ae0bf154d9b37cff03c Stored in directory: /tmp/pip-ephem-wheel-cache-rkm9hv2m/wheels/54/55/f0/134d74ed2ef12f335a7806742c56604267a8186dfba6135e06 Successfully built deepspeed DEPRECATION: apex 0.1-ascend-20231124 has a non-standard version number. pip 24.0 will enforce this behaviour change. A possible replacement is to upgrade to a newer version of apex or contact the author to suggest that they release a version with a conforming version number. Discussion can be found at https://github.com/pypa/pip/issues/12063 Installing collected packages: aniso8601, xlsxwriter, tqdm, termcolor, tabulate, requests, pynvml, pyarrow, natsort, itsdangerous, decord, blinker, huggingface-hub, flask, tokenizers, flask_restful, deepspeed, accelerate, transformers, timm, datasets Attempting uninstall: tqdm Found existing installation: tqdm 4.66.1 Uninstalling tqdm-4.66.1: Successfully uninstalled tqdm-4.66.1 Attempting uninstall: requests Found existing installation: requests 2.31.0 Uninstalling requests-2.31.0: Successfully uninstalled requests-2.31.0 Attempting uninstall: pyarrow Found existing installation: pyarrow 14.0.2 Uninstalling pyarrow-14.0.2: Successfully uninstalled pyarrow-14.0.2 Attempting uninstall: huggingface-hub Found existing installation: huggingface-hub 0.20.2 Uninstalling huggingface-hub-0.20.2: Successfully uninstalled huggingface-hub-0.20.2 Attempting uninstall: tokenizers Found existing installation: tokenizers 0.13.3 Uninstalling tokenizers-0.13.3: Successfully uninstalled tokenizers-0.13.3 Attempting uninstall: accelerate Found existing installation: accelerate 0.24.0 Uninstalling accelerate-0.24.0: Successfully uninstalled accelerate-0.24.0 Attempting uninstall: transformers Found existing installation: transformers 4.33.0 Uninstalling transformers-4.33.0: Successfully uninstalled transformers-4.33.0 Attempting uninstall: datasets Found existing installation: datasets 2.16.1 Uninstalling datasets-2.16.1: Successfully uninstalled datasets-2.16.1 ERROR: pip's dependency resolver does not currently take into account all the packages that are installed. This behaviour is the source of the following dependency conflicts. tikit 1.8.2.240923 requires dicttoxml==1.7.4, which is not installed. tikit 1.8.2.240923 requires docopt==0.6.2, which is not installed. tikit 1.8.2.240923 requires future==0.18.2, which is not installed. tikit 1.8.2.240923 requires hdfs==2.6.0, which is not installed. tikit 1.8.2.240923 requires pure-sasl==0.6.2, which is not installed. tikit 1.8.2.240923 requires py4j==0.10.7, which is not installed. tikit 1.8.2.240923 requires PyHive[hive]==0.6.4, which is not installed. tikit 1.8.2.240923 requires pyjwt>=2.4.0, which is not installed. tikit 1.8.2.240923 requires requests-kerberos>=0.14.0, which is not installed. tikit 1.8.2.240923 requires sasl==0.3.1, which is not installed. tikit 1.8.2.240923 requires thrift==0.15.0, which is not installed. tikit 1.8.2.240923 requires thrift-sasl>=0.1.0, which is not installed. tikit 1.8.2.240923 requires certifi==2021.10.8, but you have certifi 2023.11.17 which is incompatible. tikit 1.8.2.240923 requires cos-python-sdk-v5==1.9.29, but you have cos-python-sdk-v5 1.9.27 which is incompatible. tikit 1.8.2.240923 requires idna==3.3, but you have idna 3.6 which is incompatible. tikit 1.8.2.240923 requires prettytable==2.5.0, but you have prettytable 3.10.0 which is incompatible. tikit 1.8.2.240923 requires urllib3==1.26.7, but you have urllib3 2.1.0 which is incompatible. tikit 1.8.2.240923 requires wcwidth==0.2.5, but you have wcwidth 0.2.13 which is incompatible. Successfully installed accelerate-0.29.3 aniso8601-9.0.1 blinker-1.8.2 datasets-2.21.0 decord-0.6.0 deepspeed-0.14.2 flask-3.0.3 flask_restful-0.3.10 huggingface-hub-0.25.2 itsdangerous-2.2.0 natsort-8.4.0 pyarrow-16.1.0 pynvml-11.5.0 requests-2.32.3 tabulate-0.9.0 termcolor-2.4.0 timm-1.0.7 tokenizers-0.19.1 tqdm-4.66.5 transformers-4.40.1 xlsxwriter-3.2.0 WARNING: Running pip as the 'root' user can result in broken permissions and conflicting behaviour with the system package manager. It is recommended to use a virtual environment instead: https://pip.pypa.io/warnings/venv + MEGATRON_DIR=/local_disk/cognitron_vl//third_party/Megatron-LM_core_r0.6.0/ + MINDSPEED_DIR=/local_disk/cognitron_vl//third_party/MindSpeed_core_r0.6.0/ + MODELLINK_DIR=/local_disk/cognitron_vl//third_party/ModelLink/ + pip3 install --no-index --find-links=/data/software/ -e /local_disk/cognitron_vl//third_party/Megatron-LM_core_r0.6.0/ Looking in links: /data/software/ Obtaining file://local_disk/cognitron_vl/third_party/Megatron-LM_core_r0.6.0 Installing build dependencies: started Installing build dependencies: finished with status 'done' Checking if build backend supports build_editable: started Checking if build backend supports build_editable: finished with status 'done' Getting requirements to build editable: started Getting requirements to build editable: finished with status 'done' Installing backend dependencies: started Installing backend dependencies: finished with status 'done' Preparing editable metadata (pyproject.toml): started Preparing editable metadata (pyproject.toml): finished with status 'done' Building wheels for collected packages: megatron_core Building editable for megatron_core (pyproject.toml): started Building editable for megatron_core (pyproject.toml): finished with status 'done' Created wheel for megatron_core: filename=megatron_core-0.6.0-0.editable-cp38-cp38-linux_x86_64.whl size=8790 sha256=ec3db0c411604d56cb57d3e697a6079b7ba03618581bfb835595650f8c3caf53 Stored in directory: /tmp/pip-ephem-wheel-cache-av7vvqxa/wheels/54/9c/d1/d2015aa0c34e791e64d65d19395e5a9a5528f0c63fd519b9ff Successfully built megatron_core DEPRECATION: apex 0.1-ascend-20231124 has a non-standard version number. pip 24.0 will enforce this behaviour change. A possible replacement is to upgrade to a newer version of apex or contact the author to suggest that they release a version with a conforming version number. Discussion can be found at https://github.com/pypa/pip/issues/12063 Installing collected packages: megatron_core Attempting uninstall: megatron_core Found existing installation: megatron-core 0.1.0 Uninstalling megatron-core-0.1.0: Successfully uninstalled megatron-core-0.1.0 Successfully installed megatron_core-0.6.0 WARNING: Running pip as the 'root' user can result in broken permissions and conflicting behaviour with the system package manager. It is recommended to use a virtual environment instead: https://pip.pypa.io/warnings/venv + pip3 install --no-index --find-links=/data/software/ -e /local_disk/cognitron_vl//third_party/MindSpeed_core_r0.6.0/ Looking in links: /data/software/ Obtaining file://local_disk/cognitron_vl/third_party/MindSpeed_core_r0.6.0 Preparing metadata (setup.py): started Preparing metadata (setup.py): finished with status 'done' WARNING: Error parsing requirements for tokenizers: [Errno 2] No such file or directory: '/root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/tokenizers-0.19.1.dist-info/METADATA' WARNING: Error parsing requirements for transformers: [Errno 2] No such file or directory: '/root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/transformers-4.40.1.dist-info/METADATA' DEPRECATION: apex 0.1-ascend-20231124 has a non-standard version number. pip 24.0 will enforce this behaviour change. A possible replacement is to upgrade to a newer version of apex or contact the author to suggest that they release a version with a conforming version number. Discussion can be found at https://github.com/pypa/pip/issues/12063 Installing collected packages: mindspeed Running setup.py develop for mindspeed Successfully installed mindspeed-0.6.0 WARNING: Running pip as the 'root' user can result in broken permissions and conflicting behaviour with the system package manager. It is recommended to use a virtual environment instead: https://pip.pypa.io/warnings/venv + pip3 install --no-index --find-links=/data/software/ -e /local_disk/cognitron_vl//third_party/ModelLink/ Looking in links: /data/software/ Obtaining file://local_disk/cognitron_vl/third_party/ModelLink Preparing metadata (setup.py): started Preparing metadata (setup.py): finished with status 'done' Requirement already satisfied: numpy in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from modellink==0.0.1) (1.24.4) Processing data/software/transformers-4.43.2-py3-none-any.whl (from modellink==0.0.1) Requirement already satisfied: transformers_stream_generator in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from modellink==0.0.1) (0.0.4) Requirement already satisfied: sympy in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from modellink==0.0.1) (1.12) Requirement already satisfied: decorator in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from modellink==0.0.1) (5.1.1) Requirement already satisfied: scipy in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from modellink==0.0.1) (1.10.1) Requirement already satisfied: sentencepiece in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from modellink==0.0.1) (0.1.99) Requirement already satisfied: einops in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from modellink==0.0.1) (0.6.1) Requirement already satisfied: datasets in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from modellink==0.0.1) (2.21.0) Requirement already satisfied: pybind11 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from modellink==0.0.1) (2.11.1) Requirement already satisfied: accelerate in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from modellink==0.0.1) (0.29.3) Requirement already satisfied: six in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from modellink==0.0.1) (1.16.0) Requirement already satisfied: protobuf in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from modellink==0.0.1) (3.20.3) Processing data/software/peft-0.7.1-py3-none-any.whl (from modellink==0.0.1) Requirement already satisfied: tiktoken in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from modellink==0.0.1) (0.5.2) Requirement already satisfied: packaging>=20.0 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from peft==0.7.1->modellink==0.0.1) (23.2) Requirement already satisfied: psutil in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from peft==0.7.1->modellink==0.0.1) (5.9.7) Requirement already satisfied: pyyaml in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from peft==0.7.1->modellink==0.0.1) (6.0.1) Requirement already satisfied: torch>=1.13.0 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from peft==0.7.1->modellink==0.0.1) (2.1.0+cpu) Requirement already satisfied: tqdm in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from peft==0.7.1->modellink==0.0.1) (4.66.5) Requirement already satisfied: safetensors in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from peft==0.7.1->modellink==0.0.1) (0.4.1) Requirement already satisfied: huggingface-hub>=0.17.0 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from peft==0.7.1->modellink==0.0.1) (0.25.2) Requirement already satisfied: filelock in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from transformers==4.43.2->modellink==0.0.1) (3.13.1) Requirement already satisfied: regex!=2019.12.17 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from transformers==4.43.2->modellink==0.0.1) (2023.12.25) Requirement already satisfied: requests in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from transformers==4.43.2->modellink==0.0.1) (2.32.3) Processing data/software/tokenizers-0.19.1-cp38-cp38-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (from transformers==4.43.2->modellink==0.0.1) Requirement already satisfied: pyarrow>=15.0.0 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from datasets->modellink==0.0.1) (16.1.0) Requirement already satisfied: dill<0.3.9,>=0.3.0 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from datasets->modellink==0.0.1) (0.3.7) Requirement already satisfied: pandas in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from datasets->modellink==0.0.1) (2.0.3) Requirement already satisfied: xxhash in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from datasets->modellink==0.0.1) (3.4.1) Requirement already satisfied: multiprocess in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from datasets->modellink==0.0.1) (0.70.15) Requirement already satisfied: fsspec<=2024.6.1,>=2023.1.0 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from fsspec[http]<=2024.6.1,>=2023.1.0->datasets->modellink==0.0.1) (2023.10.0) Requirement already satisfied: aiohttp in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from datasets->modellink==0.0.1) (3.9.1) Requirement already satisfied: mpmath>=0.19 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from sympy->modellink==0.0.1) (1.3.0) Requirement already satisfied: attrs>=17.3.0 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from aiohttp->datasets->modellink==0.0.1) (23.2.0) Requirement already satisfied: multidict<7.0,>=4.5 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from aiohttp->datasets->modellink==0.0.1) (6.0.4) Requirement already satisfied: yarl<2.0,>=1.0 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from aiohttp->datasets->modellink==0.0.1) (1.9.4) Requirement already satisfied: frozenlist>=1.1.1 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from aiohttp->datasets->modellink==0.0.1) (1.4.1) Requirement already satisfied: aiosignal>=1.1.2 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from aiohttp->datasets->modellink==0.0.1) (1.3.1) Requirement already satisfied: async-timeout<5.0,>=4.0 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from aiohttp->datasets->modellink==0.0.1) (4.0.3) Requirement already satisfied: typing-extensions>=3.7.4.3 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from huggingface-hub>=0.17.0->peft==0.7.1->modellink==0.0.1) (4.9.0) Requirement already satisfied: charset-normalizer<4,>=2 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from requests->transformers==4.43.2->modellink==0.0.1) (3.3.2) Requirement already satisfied: idna<4,>=2.5 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from requests->transformers==4.43.2->modellink==0.0.1) (3.6) Requirement already satisfied: urllib3<3,>=1.21.1 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from requests->transformers==4.43.2->modellink==0.0.1) (2.1.0) Requirement already satisfied: certifi>=2017.4.17 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from requests->transformers==4.43.2->modellink==0.0.1) (2023.11.17) Requirement already satisfied: networkx in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from torch>=1.13.0->peft==0.7.1->modellink==0.0.1) (3.1) Requirement already satisfied: jinja2 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from torch>=1.13.0->peft==0.7.1->modellink==0.0.1) (3.1.2) Requirement already satisfied: python-dateutil>=2.8.2 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from pandas->datasets->modellink==0.0.1) (2.8.2) Requirement already satisfied: pytz>=2020.1 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from pandas->datasets->modellink==0.0.1) (2023.3.post1) Requirement already satisfied: tzdata>=2022.1 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from pandas->datasets->modellink==0.0.1) (2023.4) Requirement already satisfied: MarkupSafe>=2.0 in /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages (from jinja2->torch>=1.13.0->peft==0.7.1->modellink==0.0.1) (2.1.3) DEPRECATION: apex 0.1-ascend-20231124 has a non-standard version number. pip 24.0 will enforce this behaviour change. A possible replacement is to upgrade to a newer version of apex or contact the author to suggest that they release a version with a conforming version number. Discussion can be found at https://github.com/pypa/pip/issues/12063 Installing collected packages: tokenizers, transformers, peft, modellink Attempting uninstall: tokenizers Found existing installation: tokenizers 0.20.1 Uninstalling tokenizers-0.20.1: Successfully uninstalled tokenizers-0.20.1 Attempting uninstall: transformers Found existing installation: transformers 4.45.2 Uninstalling transformers-4.45.2: Successfully uninstalled transformers-4.45.2 Attempting uninstall: peft Found existing installation: peft 0.5.0 Uninstalling peft-0.5.0: Successfully uninstalled peft-0.5.0 Running setup.py develop for modellink Successfully installed modellink-0.0.1 peft-0.7.1 tokenizers-0.19.1 transformers-4.43.2 WARNING: Running pip as the 'root' user can result in broken permissions and conflicting behaviour with the system package manager. It is recommended to use a virtual environment instead: https://pip.pypa.io/warnings/venv + export PYTHONPATH=/local_disk/cognitron_vl//third_party/Megatron-LM_core_r0.6.0//:/usr/local/Ascend/ascend-toolkit/latest/python/site-packages:/usr/local/Ascend/ascend-toolkit/latest/opp/built-in/op_impl/ai_core/tbe:/usr/local/Ascend/ascend-toolkit/latest/python/site-packages:/usr/local/Ascend/ascend-toolkit/latest/opp/built-in/op_impl/ai_core/tbe:/usr/local/Ascend/ascend-toolkit/latest/opp/op_impl/built-in/ai_core/tbe: + PYTHONPATH=/local_disk/cognitron_vl//third_party/Megatron-LM_core_r0.6.0//:/usr/local/Ascend/ascend-toolkit/latest/python/site-packages:/usr/local/Ascend/ascend-toolkit/latest/opp/built-in/op_impl/ai_core/tbe:/usr/local/Ascend/ascend-toolkit/latest/python/site-packages:/usr/local/Ascend/ascend-toolkit/latest/opp/built-in/op_impl/ai_core/tbe:/usr/local/Ascend/ascend-toolkit/latest/opp/op_impl/built-in/ai_core/tbe: + GPUS_PER_NODE=16 + NNODES=12 + NODE_RANK=9 + MASTER_PORT=34567 + export CUDA_DEVICE_MAX_CONNECTIONS=1 + CUDA_DEVICE_MAX_CONNECTIONS=1 + VISION_SEQ_LENGTH=1025 + IMAGE_TOKEN_LENGTH=256 + IMAGE_SIZE=448 + VISION_MODEL_TYPE=intern_300m + TP=8 + PP=1 + DISTRIBUTED_ARGS=' --nproc_per_node 16 --nnodes 12 --node_rank 9 --master_addr train-1165841964676693248-8uvcht9qqrr4-master-0.train-100034032793.svc.cluster.local --master_port 34567 ' + GPT_ARGS=' --use-mcore-models --tensor-model-parallel-size 8 --pipeline-model-parallel-size 1 --sequence-parallel --num-layers 48 --hidden-size 5120 --ffn-hidden-size 13824 --num-attention-heads 40 --add-qkv-bias --group-query-attention --num-query-groups 8 --tokenizer-type PretrainedFromHF --tokenizer-name-or-path /data_4/models/Qwen/Qwen2.5-14B-Instruct/ --seq-length 16384 --max-position-embeddings 16384 --micro-batch-size 1 --global-batch-size 528 --make-vocab-size-divisible-by 1 --padded-vocab-size 152064 --lr 1.00e-5 --train-iters 7000 --lr-decay-style cosine --untie-embeddings-and-output-weights --disable-bias-linear --attention-dropout 0.0 --init-method-std 0.01 --hidden-dropout 0.0 --position-embedding-type rope --rotary-base 1000000.0 --normalization RMSNorm --norm-epsilon 1e-6 --use-fused-rmsnorm --use-fused-swiglu --use-fused-rotary-pos-emb --use-rotary-position-embeddings --use-mc2 --swiglu --use-flash-attn --no-masked-softmax-fusion --attention-softmax-in-fp32 --min-lr 1.00e-7 --weight-decay 0.0 --lr-warmup-fraction 0.03 --clip-grad 1.0 --adam-beta1 0.9 --initial-loss-scale 4096 --adam-beta2 0.999 --no-gradient-accumulation-fusion --use-distributed-optimizer --bf16 --overlap-grad-reduce --finetune --vision-model-lr-mult 0.1 --vision-model-lr-decay-rate 0.9 --vision-model-type intern_300m --vision-downsample-ratio 0.5 --vision-projection-type mlp --vision-projection-pre-norm --vision-process-type dynamic --vision-normalize-type imagenet --vision-seq-length 1025 --image-token-length 256 --image-size 448 --prompt-format qwen2 --is-instruction-dataset --max-num-image 64 --max-num-frame 64 --max-fps 1 --add-class-token --reset-position-ids --reset-attention-mask --min-patch-grid 1 --max-patch-grid 12 ' + DATA_ARGS=' --data-path /local_disk/cognitron_vl//configs/lcvlm_finetune_stage2.yaml --split 100,0,0 --data-seq-length 16384 --num-workers 8 ' + CKPT_ARGS=' --load /data_2/output/LM/lcvlm_modellink/scripts/qwen25/pretrain_qwen25_14b_intern_300m_ptd_tp8pp1_stage1.sh/20241012_095536/ --vit-load / --no-load-optim --no-load-rng --seed 42 --save /data_2/output/LM/lcvlm_modellink/scripts/qwen25/finetune_qwen25_14b_intern_300m_ptd_tp8pp1_stage2.sh/20241014_131952// ' + OUTPUT_ARGS=' --log-interval 1 --save-interval 500 --eval-interval 500 --eval-iters 0 --log-throughput --distributed-timeout-minutes 120 ' + torchrun --nproc_per_node 16 --nnodes 12 --node_rank 9 --master_addr train-1165841964676693248-8uvcht9qqrr4-master-0.train-100034032793.svc.cluster.local --master_port 34567 /local_disk/cognitron_vl//lcvlm_modellink/pretrain_lcvlm.py --use-mcore-models --tensor-model-parallel-size 8 --pipeline-model-parallel-size 1 --sequence-parallel --num-layers 48 --hidden-size 5120 --ffn-hidden-size 13824 --num-attention-heads 40 --add-qkv-bias --group-query-attention --num-query-groups 8 --tokenizer-type PretrainedFromHF --tokenizer-name-or-path /data_4/models/Qwen/Qwen2.5-14B-Instruct/ --seq-length 16384 --max-position-embeddings 16384 --micro-batch-size 1 --global-batch-size 528 --make-vocab-size-divisible-by 1 --padded-vocab-size 152064 --lr 1.00e-5 --train-iters 7000 --lr-decay-style cosine --untie-embeddings-and-output-weights --disable-bias-linear --attention-dropout 0.0 --init-method-std 0.01 --hidden-dropout 0.0 --position-embedding-type rope --rotary-base 1000000.0 --normalization RMSNorm --norm-epsilon 1e-6 --use-fused-rmsnorm --use-fused-swiglu --use-fused-rotary-pos-emb --use-rotary-position-embeddings --use-mc2 --swiglu --use-flash-attn --no-masked-softmax-fusion --attention-softmax-in-fp32 --min-lr 1.00e-7 --weight-decay 0.0 --lr-warmup-fraction 0.03 --clip-grad 1.0 --adam-beta1 0.9 --initial-loss-scale 4096 --adam-beta2 0.999 --no-gradient-accumulation-fusion --use-distributed-optimizer --bf16 --overlap-grad-reduce --finetune --vision-model-lr-mult 0.1 --vision-model-lr-decay-rate 0.9 --vision-model-type intern_300m --vision-downsample-ratio 0.5 --vision-projection-type mlp --vision-projection-pre-norm --vision-process-type dynamic --vision-normalize-type imagenet --vision-seq-length 1025 --image-token-length 256 --image-size 448 --prompt-format qwen2 --is-instruction-dataset --max-num-image 64 --max-num-frame 64 --max-fps 1 --add-class-token --reset-position-ids --reset-attention-mask --min-patch-grid 1 --max-patch-grid 12 --data-path /local_disk/cognitron_vl//configs/lcvlm_finetune_stage2.yaml --split 100,0,0 --data-seq-length 16384 --num-workers 8 --load /data_2/output/LM/lcvlm_modellink/scripts/qwen25/pretrain_qwen25_14b_intern_300m_ptd_tp8pp1_stage1.sh/20241012_095536/ --vit-load / --no-load-optim --no-load-rng --seed 42 --save /data_2/output/LM/lcvlm_modellink/scripts/qwen25/finetune_qwen25_14b_intern_300m_ptd_tp8pp1_stage2.sh/20241014_131952// --log-interval 1 --save-interval 500 --eval-interval 500 --eval-iters 0 --log-throughput --distributed-timeout-minutes 120 --distributed-backend nccl [2024-10-14 13:23:18,621] torch.distributed.run: [WARNING] [2024-10-14 13:23:18,621] torch.distributed.run: [WARNING] ***************************************** [2024-10-14 13:23:18,621] torch.distributed.run: [WARNING] Setting OMP_NUM_THREADS environment variable for each process to be 1 in default, to avoid your system being overloaded, please further tune the variable for optimal performance in your application as needed. [2024-10-14 13:23:18,621] torch.distributed.run: [WARNING] ***************************************** /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch_npu/contrib/transfer_to_npu.py:260: RuntimeWarning: torch.jit.script and torch.jit.script_method will be disabled by transfer_to_npu, which currently does not support them, if you need to enable them, please do not use transfer_to_npu. warnings.warn(msg, RuntimeWarning) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch_npu/contrib/transfer_to_npu.py:260: RuntimeWarning: torch.jit.script and torch.jit.script_method will be disabled by transfer_to_npu, which currently does not support them, if you need to enable them, please do not use transfer_to_npu. warnings.warn(msg, RuntimeWarning) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch_npu/contrib/transfer_to_npu.py:260: RuntimeWarning: torch.jit.script and torch.jit.script_method will be disabled by transfer_to_npu, which currently does not support them, if you need to enable them, please do not use transfer_to_npu. warnings.warn(msg, RuntimeWarning) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch_npu/contrib/transfer_to_npu.py:260: RuntimeWarning: torch.jit.script and torch.jit.script_method will be disabled by transfer_to_npu, which currently does not support them, if you need to enable them, please do not use transfer_to_npu. warnings.warn(msg, RuntimeWarning) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch_npu/contrib/transfer_to_npu.py:260: RuntimeWarning: torch.jit.script and torch.jit.script_method will be disabled by transfer_to_npu, which currently does not support them, if you need to enable them, please do not use transfer_to_npu. warnings.warn(msg, RuntimeWarning) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch_npu/contrib/transfer_to_npu.py:260: RuntimeWarning: torch.jit.script and torch.jit.script_method will be disabled by transfer_to_npu, which currently does not support them, if you need to enable them, please do not use transfer_to_npu. warnings.warn(msg, RuntimeWarning) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch_npu/contrib/transfer_to_npu.py:260: RuntimeWarning: torch.jit.script and torch.jit.script_method will be disabled by transfer_to_npu, which currently does not support them, if you need to enable them, please do not use transfer_to_npu. warnings.warn(msg, RuntimeWarning) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch_npu/contrib/transfer_to_npu.py:260: RuntimeWarning: torch.jit.script and torch.jit.script_method will be disabled by transfer_to_npu, which currently does not support them, if you need to enable them, please do not use transfer_to_npu. warnings.warn(msg, RuntimeWarning) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch_npu/contrib/transfer_to_npu.py:260: RuntimeWarning: torch.jit.script and torch.jit.script_method will be disabled by transfer_to_npu, which currently does not support them, if you need to enable them, please do not use transfer_to_npu. warnings.warn(msg, RuntimeWarning) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch_npu/contrib/transfer_to_npu.py:260: RuntimeWarning: torch.jit.script and torch.jit.script_method will be disabled by transfer_to_npu, which currently does not support them, if you need to enable them, please do not use transfer_to_npu. warnings.warn(msg, RuntimeWarning) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch_npu/contrib/transfer_to_npu.py:260: RuntimeWarning: torch.jit.script and torch.jit.script_method will be disabled by transfer_to_npu, which currently does not support them, if you need to enable them, please do not use transfer_to_npu. warnings.warn(msg, RuntimeWarning) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch_npu/contrib/transfer_to_npu.py:260: RuntimeWarning: torch.jit.script and torch.jit.script_method will be disabled by transfer_to_npu, which currently does not support them, if you need to enable them, please do not use transfer_to_npu. warnings.warn(msg, RuntimeWarning) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch_npu/contrib/transfer_to_npu.py:260: RuntimeWarning: torch.jit.script and torch.jit.script_method will be disabled by transfer_to_npu, which currently does not support them, if you need to enable them, please do not use transfer_to_npu. warnings.warn(msg, RuntimeWarning) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch_npu/contrib/transfer_to_npu.py:260: RuntimeWarning: torch.jit.script and torch.jit.script_method will be disabled by transfer_to_npu, which currently does not support them, if you need to enable them, please do not use transfer_to_npu. warnings.warn(msg, RuntimeWarning) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch_npu/contrib/transfer_to_npu.py:260: RuntimeWarning: torch.jit.script and torch.jit.script_method will be disabled by transfer_to_npu, which currently does not support them, if you need to enable them, please do not use transfer_to_npu. warnings.warn(msg, RuntimeWarning) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch_npu/contrib/transfer_to_npu.py:260: RuntimeWarning: torch.jit.script and torch.jit.script_method will be disabled by transfer_to_npu, which currently does not support them, if you need to enable them, please do not use transfer_to_npu. warnings.warn(msg, RuntimeWarning) local_disk/cognitron_vl/third_party/Megatron-LM_core_r0.6.0/megatron/core/transformer/custom_layers/transformer_engine.py:10: DeprecationWarning: pkg_resources is deprecated as an API. See https://setuptools.pypa.io/en/latest/pkg_resources.html from pkg_resources import packaging local_disk/cognitron_vl/third_party/Megatron-LM_core_r0.6.0/megatron/core/transformer/custom_layers/transformer_engine.py:10: DeprecationWarning: pkg_resources is deprecated as an API. See https://setuptools.pypa.io/en/latest/pkg_resources.html from pkg_resources import packaging local_disk/cognitron_vl/third_party/Megatron-LM_core_r0.6.0/megatron/core/transformer/custom_layers/transformer_engine.py:10: DeprecationWarning: pkg_resources is deprecated as an API. See https://setuptools.pypa.io/en/latest/pkg_resources.html from pkg_resources import packaging /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/pkg_resources/__init__.py:2871: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('mpl_toolkits')`. Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages declare_namespace(pkg) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/pkg_resources/__init__.py:2871: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('mpl_toolkits')`. Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages declare_namespace(pkg) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/pkg_resources/__init__.py:2871: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('mpl_toolkits')`. Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages declare_namespace(pkg) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/pkg_resources/__init__.py:2871: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('google')`. Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages declare_namespace(pkg) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/pkg_resources/__init__.py:2871: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('google')`. Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages declare_namespace(pkg) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/pkg_resources/__init__.py:2871: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('google')`. Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages declare_namespace(pkg) local_disk/cognitron_vl/third_party/Megatron-LM_core_r0.6.0/megatron/core/transformer/custom_layers/transformer_engine.py:10: DeprecationWarning: pkg_resources is deprecated as an API. See https://setuptools.pypa.io/en/latest/pkg_resources.html from pkg_resources import packaging /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/pkg_resources/__init__.py:2871: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('zope')`. Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages declare_namespace(pkg) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/pkg_resources/__init__.py:2871: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('zope')`. Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages declare_namespace(pkg) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/pkg_resources/__init__.py:2871: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('zope')`. Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages declare_namespace(pkg) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/pkg_resources/__init__.py:2871: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('mpl_toolkits')`. Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages declare_namespace(pkg) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/pkg_resources/__init__.py:2871: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('google')`. Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages declare_namespace(pkg) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/pkg_resources/__init__.py:2871: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('zope')`. Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages declare_namespace(pkg) local_disk/cognitron_vl/third_party/Megatron-LM_core_r0.6.0/megatron/core/transformer/custom_layers/transformer_engine.py:10: DeprecationWarning: pkg_resources is deprecated as an API. See https://setuptools.pypa.io/en/latest/pkg_resources.html from pkg_resources import packaging local_disk/cognitron_vl/third_party/Megatron-LM_core_r0.6.0/megatron/core/transformer/custom_layers/transformer_engine.py:10: DeprecationWarning: pkg_resources is deprecated as an API. See https://setuptools.pypa.io/en/latest/pkg_resources.html from pkg_resources import packaging local_disk/cognitron_vl/third_party/Megatron-LM_core_r0.6.0/megatron/core/transformer/custom_layers/transformer_engine.py:10: DeprecationWarning: pkg_resources is deprecated as an API. See https://setuptools.pypa.io/en/latest/pkg_resources.html from pkg_resources import packaging local_disk/cognitron_vl/third_party/Megatron-LM_core_r0.6.0/megatron/core/transformer/custom_layers/transformer_engine.py:10: DeprecationWarning: pkg_resources is deprecated as an API. See https://setuptools.pypa.io/en/latest/pkg_resources.html from pkg_resources import packaging local_disk/cognitron_vl/third_party/Megatron-LM_core_r0.6.0/megatron/core/transformer/custom_layers/transformer_engine.py:10: DeprecationWarning: pkg_resources is deprecated as an API. See https://setuptools.pypa.io/en/latest/pkg_resources.html from pkg_resources import packaging local_disk/cognitron_vl/third_party/Megatron-LM_core_r0.6.0/megatron/core/transformer/custom_layers/transformer_engine.py:10: DeprecationWarning: pkg_resources is deprecated as an API. See https://setuptools.pypa.io/en/latest/pkg_resources.html from pkg_resources import packaging local_disk/cognitron_vl/third_party/Megatron-LM_core_r0.6.0/megatron/core/transformer/custom_layers/transformer_engine.py:10: DeprecationWarning: pkg_resources is deprecated as an API. See https://setuptools.pypa.io/en/latest/pkg_resources.html from pkg_resources import packaging /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/pkg_resources/__init__.py:2871: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('mpl_toolkits')`. Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages declare_namespace(pkg) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/pkg_resources/__init__.py:2871: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('mpl_toolkits')`. Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages declare_namespace(pkg) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/pkg_resources/__init__.py:2871: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('mpl_toolkits')`. Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages declare_namespace(pkg) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/pkg_resources/__init__.py:2871: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('google')`. Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages declare_namespace(pkg) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/pkg_resources/__init__.py:2871: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('google')`. Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages declare_namespace(pkg) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/pkg_resources/__init__.py:2871: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('google')`. Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages declare_namespace(pkg) local_disk/cognitron_vl/third_party/Megatron-LM_core_r0.6.0/megatron/core/transformer/custom_layers/transformer_engine.py:10: DeprecationWarning: pkg_resources is deprecated as an API. See https://setuptools.pypa.io/en/latest/pkg_resources.html from pkg_resources import packaging /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/pkg_resources/__init__.py:2871: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('mpl_toolkits')`. Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages declare_namespace(pkg) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/pkg_resources/__init__.py:2871: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('mpl_toolkits')`. Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages declare_namespace(pkg) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/pkg_resources/__init__.py:2871: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('google')`. Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages declare_namespace(pkg) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/pkg_resources/__init__.py:2871: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('google')`. Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages declare_namespace(pkg) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/pkg_resources/__init__.py:2871: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('zope')`. Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages declare_namespace(pkg) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/pkg_resources/__init__.py:2871: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('zope')`. Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages declare_namespace(pkg) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/pkg_resources/__init__.py:2871: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('zope')`. Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages declare_namespace(pkg) local_disk/cognitron_vl/third_party/Megatron-LM_core_r0.6.0/megatron/core/transformer/custom_layers/transformer_engine.py:10: DeprecationWarning: pkg_resources is deprecated as an API. See https://setuptools.pypa.io/en/latest/pkg_resources.html from pkg_resources import packaging /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/pkg_resources/__init__.py:2871: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('mpl_toolkits')`. Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages declare_namespace(pkg) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/pkg_resources/__init__.py:2871: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('zope')`. Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages declare_namespace(pkg) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/pkg_resources/__init__.py:2871: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('google')`. Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages declare_namespace(pkg) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/pkg_resources/__init__.py:2871: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('zope')`. Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages declare_namespace(pkg) local_disk/cognitron_vl/third_party/Megatron-LM_core_r0.6.0/megatron/core/transformer/custom_layers/transformer_engine.py:10: DeprecationWarning: pkg_resources is deprecated as an API. See https://setuptools.pypa.io/en/latest/pkg_resources.html from pkg_resources import packaging /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/pkg_resources/__init__.py:2871: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('mpl_toolkits')`. Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages declare_namespace(pkg) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/pkg_resources/__init__.py:2871: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('google')`. Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages declare_namespace(pkg) local_disk/cognitron_vl/third_party/Megatron-LM_core_r0.6.0/megatron/core/transformer/custom_layers/transformer_engine.py:10: DeprecationWarning: pkg_resources is deprecated as an API. See https://setuptools.pypa.io/en/latest/pkg_resources.html from pkg_resources import packaging /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/pkg_resources/__init__.py:2871: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('zope')`. Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages declare_namespace(pkg) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/pkg_resources/__init__.py:2871: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('mpl_toolkits')`. Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages declare_namespace(pkg) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/pkg_resources/__init__.py:2871: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('google')`. Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages declare_namespace(pkg) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/pkg_resources/__init__.py:2871: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('zope')`. Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages declare_namespace(pkg) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/pkg_resources/__init__.py:2871: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('zope')`. Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages declare_namespace(pkg) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/pkg_resources/__init__.py:2871: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('mpl_toolkits')`. Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages declare_namespace(pkg) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/pkg_resources/__init__.py:2871: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('google')`. Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages declare_namespace(pkg) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/pkg_resources/__init__.py:2871: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('mpl_toolkits')`. Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages declare_namespace(pkg) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/pkg_resources/__init__.py:2871: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('google')`. Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages declare_namespace(pkg) local_disk/cognitron_vl/third_party/Megatron-LM_core_r0.6.0/megatron/core/transformer/custom_layers/transformer_engine.py:10: DeprecationWarning: pkg_resources is deprecated as an API. See https://setuptools.pypa.io/en/latest/pkg_resources.html from pkg_resources import packaging /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/pkg_resources/__init__.py:2871: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('mpl_toolkits')`. Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages declare_namespace(pkg) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/pkg_resources/__init__.py:2871: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('zope')`. Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages declare_namespace(pkg) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/pkg_resources/__init__.py:2871: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('google')`. Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages declare_namespace(pkg) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/pkg_resources/__init__.py:2871: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('zope')`. Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages declare_namespace(pkg) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/pkg_resources/__init__.py:2871: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('zope')`. Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages declare_namespace(pkg) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/pkg_resources/__init__.py:2871: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('mpl_toolkits')`. Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages declare_namespace(pkg) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/pkg_resources/__init__.py:2871: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('google')`. Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages declare_namespace(pkg) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/pkg_resources/__init__.py:2871: DeprecationWarning: Deprecated call to `pkg_resources.declare_namespace('zope')`. Implementing implicit namespace packages (as specified in PEP 420) is preferred to `pkg_resources.declare_namespace`. See https://setuptools.pypa.io/en/latest/references/keywords.html#keyword-namespace-packages declare_namespace(pkg) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torchvision/io/image.py:13: UserWarning: Failed to load image Python extension: 'libc10_cuda.so: cannot open shared object file: No such file or directory'If you don't plan on using image functionality from `torchvision.io`, you can ignore this warning. Otherwise, there might be something wrong with your environment. Did you have `libjpeg` or `libpng` installed before building `torchvision` from source? warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torchvision/io/image.py:13: UserWarning: Failed to load image Python extension: 'libc10_cuda.so: cannot open shared object file: No such file or directory'If you don't plan on using image functionality from `torchvision.io`, you can ignore this warning. Otherwise, there might be something wrong with your environment. Did you have `libjpeg` or `libpng` installed before building `torchvision` from source? warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torchvision/io/image.py:13: UserWarning: Failed to load image Python extension: 'libc10_cuda.so: cannot open shared object file: No such file or directory'If you don't plan on using image functionality from `torchvision.io`, you can ignore this warning. Otherwise, there might be something wrong with your environment. Did you have `libjpeg` or `libpng` installed before building `torchvision` from source? warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torchvision/io/image.py:13: UserWarning: Failed to load image Python extension: 'libc10_cuda.so: cannot open shared object file: No such file or directory'If you don't plan on using image functionality from `torchvision.io`, you can ignore this warning. Otherwise, there might be something wrong with your environment. Did you have `libjpeg` or `libpng` installed before building `torchvision` from source? warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torchvision/io/image.py:13: UserWarning: Failed to load image Python extension: 'libc10_cuda.so: cannot open shared object file: No such file or directory'If you don't plan on using image functionality from `torchvision.io`, you can ignore this warning. Otherwise, there might be something wrong with your environment. Did you have `libjpeg` or `libpng` installed before building `torchvision` from source? warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torchvision/io/image.py:13: UserWarning: Failed to load image Python extension: 'libc10_cuda.so: cannot open shared object file: No such file or directory'If you don't plan on using image functionality from `torchvision.io`, you can ignore this warning. Otherwise, there might be something wrong with your environment. Did you have `libjpeg` or `libpng` installed before building `torchvision` from source? warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torchvision/io/image.py:13: UserWarning: Failed to load image Python extension: 'libc10_cuda.so: cannot open shared object file: No such file or directory'If you don't plan on using image functionality from `torchvision.io`, you can ignore this warning. Otherwise, there might be something wrong with your environment. Did you have `libjpeg` or `libpng` installed before building `torchvision` from source? warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torchvision/io/image.py:13: UserWarning: Failed to load image Python extension: 'libc10_cuda.so: cannot open shared object file: No such file or directory'If you don't plan on using image functionality from `torchvision.io`, you can ignore this warning. Otherwise, there might be something wrong with your environment. Did you have `libjpeg` or `libpng` installed before building `torchvision` from source? warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torchvision/io/image.py:13: UserWarning: Failed to load image Python extension: 'libc10_cuda.so: cannot open shared object file: No such file or directory'If you don't plan on using image functionality from `torchvision.io`, you can ignore this warning. Otherwise, there might be something wrong with your environment. Did you have `libjpeg` or `libpng` installed before building `torchvision` from source? warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torchvision/io/image.py:13: UserWarning: Failed to load image Python extension: 'libc10_cuda.so: cannot open shared object file: No such file or directory'If you don't plan on using image functionality from `torchvision.io`, you can ignore this warning. Otherwise, there might be something wrong with your environment. Did you have `libjpeg` or `libpng` installed before building `torchvision` from source? warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torchvision/io/image.py:13: UserWarning: Failed to load image Python extension: 'libc10_cuda.so: cannot open shared object file: No such file or directory'If you don't plan on using image functionality from `torchvision.io`, you can ignore this warning. Otherwise, there might be something wrong with your environment. Did you have `libjpeg` or `libpng` installed before building `torchvision` from source? warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torchvision/io/image.py:13: UserWarning: Failed to load image Python extension: 'libc10_cuda.so: cannot open shared object file: No such file or directory'If you don't plan on using image functionality from `torchvision.io`, you can ignore this warning. Otherwise, there might be something wrong with your environment. Did you have `libjpeg` or `libpng` installed before building `torchvision` from source? warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torchvision/io/image.py:13: UserWarning: Failed to load image Python extension: 'libc10_cuda.so: cannot open shared object file: No such file or directory'If you don't plan on using image functionality from `torchvision.io`, you can ignore this warning. Otherwise, there might be something wrong with your environment. Did you have `libjpeg` or `libpng` installed before building `torchvision` from source? warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torchvision/io/image.py:13: UserWarning: Failed to load image Python extension: 'libc10_cuda.so: cannot open shared object file: No such file or directory'If you don't plan on using image functionality from `torchvision.io`, you can ignore this warning. Otherwise, there might be something wrong with your environment. Did you have `libjpeg` or `libpng` installed before building `torchvision` from source? warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torchvision/io/image.py:13: UserWarning: Failed to load image Python extension: 'libc10_cuda.so: cannot open shared object file: No such file or directory'If you don't plan on using image functionality from `torchvision.io`, you can ignore this warning. Otherwise, there might be something wrong with your environment. Did you have `libjpeg` or `libpng` installed before building `torchvision` from source? warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torchvision/io/image.py:13: UserWarning: Failed to load image Python extension: 'libc10_cuda.so: cannot open shared object file: No such file or directory'If you don't plan on using image functionality from `torchvision.io`, you can ignore this warning. Otherwise, there might be something wrong with your environment. Did you have `libjpeg` or `libpng` installed before building `torchvision` from source? warn( [W NPUCachingAllocator.cpp:623] Warning: expandable_segments currently defaults to false. You can enable this feature by `export PYTORCH_NPU_ALLOC_CONF = expandable_segments:True`. (function operator()) [W NPUCachingAllocator.cpp:623] Warning: expandable_segments currently defaults to false. You can enable this feature by `export PYTORCH_NPU_ALLOC_CONF = expandable_segments:True`. (function operator()) [W NPUCachingAllocator.cpp:623] Warning: expandable_segments currently defaults to false. You can enable this feature by `export PYTORCH_NPU_ALLOC_CONF = expandable_segments:True`. (function operator()) [W NPUCachingAllocator.cpp:623] Warning: expandable_segments currently defaults to false. You can enable this feature by `export PYTORCH_NPU_ALLOC_CONF = expandable_segments:True`. (function operator()) [W NPUCachingAllocator.cpp:623] Warning: expandable_segments currently defaults to false. You can enable this feature by `export PYTORCH_NPU_ALLOC_CONF = expandable_segments:True`. (function operator()) [W NPUCachingAllocator.cpp:623] Warning: expandable_segments currently defaults to false. You can enable this feature by `export PYTORCH_NPU_ALLOC_CONF = expandable_segments:True`. (function operator()) [W NPUCachingAllocator.cpp:623] Warning: expandable_segments currently defaults to false. You can enable this feature by `export PYTORCH_NPU_ALLOC_CONF = expandable_segments:True`. (function operator()) [W NPUCachingAllocator.cpp:623] Warning: expandable_segments currently defaults to false. You can enable this feature by `export PYTORCH_NPU_ALLOC_CONF = expandable_segments:True`. (function operator()) [W NPUCachingAllocator.cpp:623] Warning: expandable_segments currently defaults to false. You can enable this feature by `export PYTORCH_NPU_ALLOC_CONF = expandable_segments:True`. (function operator()) [W NPUCachingAllocator.cpp:623] Warning: expandable_segments currently defaults to false. You can enable this feature by `export PYTORCH_NPU_ALLOC_CONF = expandable_segments:True`. (function operator()) [W NPUCachingAllocator.cpp:623] Warning: expandable_segments currently defaults to false. You can enable this feature by `export PYTORCH_NPU_ALLOC_CONF = expandable_segments:True`. (function operator()) [W NPUCachingAllocator.cpp:623] Warning: expandable_segments currently defaults to false. You can enable this feature by `export PYTORCH_NPU_ALLOC_CONF = expandable_segments:True`. (function operator()) [W NPUCachingAllocator.cpp:623] Warning: expandable_segments currently defaults to false. You can enable this feature by `export PYTORCH_NPU_ALLOC_CONF = expandable_segments:True`. (function operator()) [W NPUCachingAllocator.cpp:623] Warning: expandable_segments currently defaults to false. You can enable this feature by `export PYTORCH_NPU_ALLOC_CONF = expandable_segments:True`. (function operator()) [W NPUCachingAllocator.cpp:623] Warning: expandable_segments currently defaults to false. You can enable this feature by `export PYTORCH_NPU_ALLOC_CONF = expandable_segments:True`. (function operator()) [W NPUCachingAllocator.cpp:623] Warning: expandable_segments currently defaults to false. You can enable this feature by `export PYTORCH_NPU_ALLOC_CONF = expandable_segments:True`. (function operator()) [W ProcessGroupHCCL.cpp:652] Warning: The HCCL execution timeout 7200000ms is bigger than watchdog timeout 1800000ms which is set by init_process_group! The plog may not be recorded. (function ProcessGroupHCCL) [W ProcessGroupHCCL.cpp:652] Warning: The HCCL execution timeout 7200000ms is bigger than watchdog timeout 1800000ms which is set by init_process_group! The plog may not be recorded. (function ProcessGroupHCCL) [W ProcessGroupHCCL.cpp:652] Warning: The HCCL execution timeout 7200000ms is bigger than watchdog timeout 1800000ms which is set by init_process_group! The plog may not be recorded. (function ProcessGroupHCCL) [W ProcessGroupHCCL.cpp:652] Warning: The HCCL execution timeout 7200000ms is bigger than watchdog timeout 1800000ms which is set by init_process_group! The plog may not be recorded. (function ProcessGroupHCCL) [W ProcessGroupHCCL.cpp:652] Warning: The HCCL execution timeout 7200000ms is bigger than watchdog timeout 1800000ms which is set by init_process_group! The plog may not be recorded. (function ProcessGroupHCCL) [W ProcessGroupHCCL.cpp:652] Warning: The HCCL execution timeout 7200000ms is bigger than watchdog timeout 1800000ms which is set by init_process_group! The plog may not be recorded. (function ProcessGroupHCCL) [W ProcessGroupHCCL.cpp:652] Warning: The HCCL execution timeout 7200000ms is bigger than watchdog timeout 1800000ms which is set by init_process_group! The plog may not be recorded. (function ProcessGroupHCCL) [W ProcessGroupHCCL.cpp:652] Warning: The HCCL execution timeout 7200000ms is bigger than watchdog timeout 1800000ms which is set by init_process_group! The plog may not be recorded. (function ProcessGroupHCCL) [W ProcessGroupHCCL.cpp:652] Warning: The HCCL execution timeout 7200000ms is bigger than watchdog timeout 1800000ms which is set by init_process_group! The plog may not be recorded. (function ProcessGroupHCCL) [W ProcessGroupHCCL.cpp:652] Warning: The HCCL execution timeout 7200000ms is bigger than watchdog timeout 1800000ms which is set by init_process_group! The plog may not be recorded. (function ProcessGroupHCCL) [W ProcessGroupHCCL.cpp:652] Warning: The HCCL execution timeout 7200000ms is bigger than watchdog timeout 1800000ms which is set by init_process_group! The plog may not be recorded. (function ProcessGroupHCCL) [W ProcessGroupHCCL.cpp:652] Warning: The HCCL execution timeout 7200000ms is bigger than watchdog timeout 1800000ms which is set by init_process_group! The plog may not be recorded. (function ProcessGroupHCCL) [W ProcessGroupHCCL.cpp:652] Warning: The HCCL execution timeout 7200000ms is bigger than watchdog timeout 1800000ms which is set by init_process_group! The plog may not be recorded. (function ProcessGroupHCCL) [W ProcessGroupHCCL.cpp:652] Warning: The HCCL execution timeout 7200000ms is bigger than watchdog timeout 1800000ms which is set by init_process_group! The plog may not be recorded. (function ProcessGroupHCCL) [W ProcessGroupHCCL.cpp:652] Warning: The HCCL execution timeout 7200000ms is bigger than watchdog timeout 1800000ms which is set by init_process_group! The plog may not be recorded. (function ProcessGroupHCCL) [W ProcessGroupHCCL.cpp:652] Warning: The HCCL execution timeout 7200000ms is bigger than watchdog timeout 1800000ms which is set by init_process_group! The plog may not be recorded. (function ProcessGroupHCCL) > compiling dataset index builder ... [W ProcessGroupHCCL.cpp:652] Warning: The HCCL execution timeout 7200000ms is bigger than watchdog timeout 1800000ms which is set by init_process_group! The plog may not be recorded. (function ProcessGroupHCCL) [W ProcessGroupHCCL.cpp:652] Warning: The HCCL execution timeout 7200000ms is bigger than watchdog timeout 1800000ms which is set by init_process_group! The plog may not be recorded. (function ProcessGroupHCCL) [W ProcessGroupHCCL.cpp:652] Warning: The HCCL execution timeout 7200000ms is bigger than watchdog timeout 1800000ms which is set by init_process_group! The plog may not be recorded. (function ProcessGroupHCCL) [W ProcessGroupHCCL.cpp:652] Warning: The HCCL execution timeout 7200000ms is bigger than watchdog timeout 1800000ms which is set by init_process_group! The plog may not be recorded. (function ProcessGroupHCCL) [W ProcessGroupHCCL.cpp:652] Warning: The HCCL execution timeout 7200000ms is bigger than watchdog timeout 1800000ms which is set by init_process_group! The plog may not be recorded. (function ProcessGroupHCCL) [W ProcessGroupHCCL.cpp:652] Warning: The HCCL execution timeout 7200000ms is bigger than watchdog timeout 1800000ms which is set by init_process_group! The plog may not be recorded. (function ProcessGroupHCCL) [W ProcessGroupHCCL.cpp:652] Warning: The HCCL execution timeout 7200000ms is bigger than watchdog timeout 1800000ms which is set by init_process_group! The plog may not be recorded. (function ProcessGroupHCCL) [W ProcessGroupHCCL.cpp:652] Warning: The HCCL execution timeout 7200000ms is bigger than watchdog timeout 1800000ms which is set by init_process_group! The plog may not be recorded. (function ProcessGroupHCCL) [W ProcessGroupHCCL.cpp:652] Warning: The HCCL execution timeout 7200000ms is bigger than watchdog timeout 1800000ms which is set by init_process_group! The plog may not be recorded. (function ProcessGroupHCCL) [W ProcessGroupHCCL.cpp:652] Warning: The HCCL execution timeout 7200000ms is bigger than watchdog timeout 1800000ms which is set by init_process_group! The plog may not be recorded. (function ProcessGroupHCCL) [W ProcessGroupHCCL.cpp:652] Warning: The HCCL execution timeout 7200000ms is bigger than watchdog timeout 1800000ms which is set by init_process_group! The plog may not be recorded. (function ProcessGroupHCCL) [W ProcessGroupHCCL.cpp:652] Warning: The HCCL execution timeout 7200000ms is bigger than watchdog timeout 1800000ms which is set by init_process_group! The plog may not be recorded. (function ProcessGroupHCCL) make: Entering directory 'local_disk/cognitron_vl/third_party/Megatron-LM_core_r0.6.0/megatron/core/datasets' [W ProcessGroupHCCL.cpp:652] Warning: The HCCL execution timeout 7200000ms is bigger than watchdog timeout 1800000ms which is set by init_process_group! The plog may not be recorded. (function ProcessGroupHCCL) [W ProcessGroupHCCL.cpp:652] Warning: The HCCL execution timeout 7200000ms is bigger than watchdog timeout 1800000ms which is set by init_process_group! The plog may not be recorded. (function ProcessGroupHCCL) [W ProcessGroupHCCL.cpp:652] Warning: The HCCL execution timeout 7200000ms is bigger than watchdog timeout 1800000ms which is set by init_process_group! The plog may not be recorded. (function ProcessGroupHCCL) [W ProcessGroupHCCL.cpp:652] Warning: The HCCL execution timeout 7200000ms is bigger than watchdog timeout 1800000ms which is set by init_process_group! The plog may not be recorded. (function ProcessGroupHCCL) make: Nothing to be done for 'default'. make: Leaving directory 'local_disk/cognitron_vl/third_party/Megatron-LM_core_r0.6.0/megatron/core/datasets' >>> done with dataset index builder. Compilation time: 4.325 seconds vision_projection_recompute False vision_projection_recompute False vision_projection_recompute False vision_projection_recompute False vision_projection_recompute False vision_projection_recompute False vision_projection_recompute False vision_projection_recompute False vision_projection_recompute False vision_projection_recompute False vision_projection_recompute False vision_projection_recompute False vision_projection_recompute False vision_projection_recompute False vision_projection_recompute False vision_projection_recompute False model GPTVLModel( (external_feature_model): MegatronVisionModel( (vit): InternViTModel( (conv1): Conv2d(3, 1024, kernel_size=(14, 14), stride=(14, 14)) (position_embeddings): Embedding(1025, 1024) (decoder): TransformerBlock( (layers): ModuleList( (0-23): 24 x InternViTTransformerLayer( (input_layernorm): LayerNorm((1024,), eps=1e-06, elementwise_affine=True) (self_attention): SelfAttention( (core_attention): DotProductAttention( (scale_mask_softmax): FusedScaleMaskSoftmax() (attention_dropout): Dropout(p=0.0, inplace=False) ) (linear_proj): RowParallelLinear() (linear_qkv): ColumnParallelLinear() ) (self_attn_bda): IdentityFuncOp() (pre_cross_attn_layernorm): IdentityOp() (cross_attention): IdentityOp() (cross_attn_bda): IdentityFuncOp() (pre_mlp_layernorm): LayerNorm((1024,), eps=1e-06, elementwise_affine=True) (mlp): MLP( (linear_fc1): ColumnParallelLinear() (linear_fc2): RowParallelLinear() ) (mlp_bda): IdentityFuncOp() ) ) ) ) (vision_projection): MultimodalProjector( (encoder): MLP( (linear_fc1): ColumnParallelLinear() (linear_fc2): RowParallelLinear() ) ) (pre_proj_layernorm): LayerNorm((4096,), eps=1e-05, elementwise_affine=True) ) (embedding): LanguageModelEmbedding( (word_embeddings): VocabParallelEmbedding() (embedding_dropout): Dropout(p=0.0, inplace=False) ) (rotary_pos_emb): RotaryEmbedding() (decoder): TransformerBlock( (layers): ModuleList( (0-47): 48 x TransformerLayer( (input_layernorm): RMSNorm() (self_attention): SelfAttention( (core_attention): DotProductAttention( (scale_mask_softmax): FusedScaleMaskSoftmax() (attention_dropout): Dropout(p=0.0, inplace=False) ) (linear_proj): RowParallelLinear() (linear_qkv): ColumnParallelLinear() (q_layernorm): IdentityOp() (k_layernorm): IdentityOp() ) (pre_cross_attn_layernorm): IdentityOp() (cross_attention): IdentityOp() (cross_attn_bda): IdentityFuncOp() (pre_mlp_layernorm): RMSNorm() (mlp): MLP( (linear_fc1): ColumnParallelLinear() (linear_fc2): RowParallelLinear() ) ) ) (final_layernorm): RMSNorm() ) (output_layer): ColumnParallelLinear() ) model GPTVLModel( (external_feature_model): MegatronVisionModel( (vit): InternViTModel( (conv1): Conv2d(3, 1024, kernel_size=(14, 14), stride=(14, 14)) (position_embeddings): Embedding(1025, 1024) (decoder): TransformerBlock( (layers): ModuleList( (0-23): 24 x InternViTTransformerLayer( (input_layernorm): LayerNorm((1024,), eps=1e-06, elementwise_affine=True) (self_attention): SelfAttention( (core_attention): DotProductAttention( (scale_mask_softmax): FusedScaleMaskSoftmax() (attention_dropout): Dropout(p=0.0, inplace=False) ) (linear_proj): RowParallelLinear() (linear_qkv): ColumnParallelLinear() ) (self_attn_bda): IdentityFuncOp() (pre_cross_attn_layernorm): IdentityOp() (cross_attention): IdentityOp() (cross_attn_bda): IdentityFuncOp() (pre_mlp_layernorm): LayerNorm((1024,), eps=1e-06, elementwise_affine=True) (mlp): MLP( (linear_fc1): ColumnParallelLinear() (linear_fc2): RowParallelLinear() ) (mlp_bda): IdentityFuncOp() ) ) ) ) (vision_projection): MultimodalProjector( (encoder): MLP( (linear_fc1): ColumnParallelLinear() (linear_fc2): RowParallelLinear() ) ) (pre_proj_layernorm): LayerNorm((4096,), eps=1e-05, elementwise_affine=True) ) (embedding): LanguageModelEmbedding( (word_embeddings): VocabParallelEmbedding() (embedding_dropout): Dropout(p=0.0, inplace=False) ) (rotary_pos_emb): RotaryEmbedding() (decoder): TransformerBlock( (layers): ModuleList( (0-47): 48 x TransformerLayer( (input_layernorm): RMSNorm() (self_attention): SelfAttention( (core_attention): DotProductAttention( (scale_mask_softmax): FusedScaleMaskSoftmax() (attention_dropout): Dropout(p=0.0, inplace=False) ) (linear_proj): RowParallelLinear() (linear_qkv): ColumnParallelLinear() (q_layernorm): IdentityOp() (k_layernorm): IdentityOp() ) (pre_cross_attn_layernorm): IdentityOp() (cross_attention): IdentityOp() (cross_attn_bda): IdentityFuncOp() (pre_mlp_layernorm): RMSNorm() (mlp): MLP( (linear_fc1): ColumnParallelLinear() (linear_fc2): RowParallelLinear() ) ) ) (final_layernorm): RMSNorm() ) (output_layer): ColumnParallelLinear() ) model GPTVLModel( (external_feature_model): MegatronVisionModel( (vit): InternViTModel( (conv1): Conv2d(3, 1024, kernel_size=(14, 14), stride=(14, 14)) (position_embeddings): Embedding(1025, 1024) (decoder): TransformerBlock( (layers): ModuleList( (0-23): 24 x InternViTTransformerLayer( (input_layernorm): LayerNorm((1024,), eps=1e-06, elementwise_affine=True) (self_attention): SelfAttention( (core_attention): DotProductAttention( (scale_mask_softmax): FusedScaleMaskSoftmax() (attention_dropout): Dropout(p=0.0, inplace=False) ) (linear_proj): RowParallelLinear() (linear_qkv): ColumnParallelLinear() ) (self_attn_bda): IdentityFuncOp() (pre_cross_attn_layernorm): IdentityOp() (cross_attention): IdentityOp() (cross_attn_bda): IdentityFuncOp() (pre_mlp_layernorm): LayerNorm((1024,), eps=1e-06, elementwise_affine=True) (mlp): MLP( (linear_fc1): ColumnParallelLinear() (linear_fc2): RowParallelLinear() ) (mlp_bda): IdentityFuncOp() ) ) ) ) (vision_projection): MultimodalProjector( (encoder): MLP( (linear_fc1): ColumnParallelLinear() (linear_fc2): RowParallelLinear() ) ) (pre_proj_layernorm): LayerNorm((4096,), eps=1e-05, elementwise_affine=True) ) (embedding): LanguageModelEmbedding( (word_embeddings): VocabParallelEmbedding() (embedding_dropout): Dropout(p=0.0, inplace=False) ) (rotary_pos_emb): RotaryEmbedding() (decoder): TransformerBlock( (layers): ModuleList( (0-47): 48 x TransformerLayer( (input_layernorm): RMSNorm() (self_attention): SelfAttention( (core_attention): DotProductAttention( (scale_mask_softmax): FusedScaleMaskSoftmax() (attention_dropout): Dropout(p=0.0, inplace=False) ) (linear_proj): RowParallelLinear() (linear_qkv): ColumnParallelLinear() (q_layernorm): IdentityOp() (k_layernorm): IdentityOp() ) (pre_cross_attn_layernorm): IdentityOp() (cross_attention): IdentityOp() (cross_attn_bda): IdentityFuncOp() (pre_mlp_layernorm): RMSNorm() (mlp): MLP( (linear_fc1): ColumnParallelLinear() (linear_fc2): RowParallelLinear() ) ) ) (final_layernorm): RMSNorm() ) (output_layer): ColumnParallelLinear() ) model GPTVLModel( (external_feature_model): MegatronVisionModel( (vit): InternViTModel( (conv1): Conv2d(3, 1024, kernel_size=(14, 14), stride=(14, 14)) (position_embeddings): Embedding(1025, 1024) (decoder): TransformerBlock( (layers): ModuleList( (0-23): 24 x InternViTTransformerLayer( (input_layernorm): LayerNorm((1024,), eps=1e-06, elementwise_affine=True) (self_attention): SelfAttention( (core_attention): DotProductAttention( (scale_mask_softmax): FusedScaleMaskSoftmax() (attention_dropout): Dropout(p=0.0, inplace=False) ) (linear_proj): RowParallelLinear() (linear_qkv): ColumnParallelLinear() ) (self_attn_bda): IdentityFuncOp() (pre_cross_attn_layernorm): IdentityOp() (cross_attention): IdentityOp() (cross_attn_bda): IdentityFuncOp() (pre_mlp_layernorm): LayerNorm((1024,), eps=1e-06, elementwise_affine=True) (mlp): MLP( (linear_fc1): ColumnParallelLinear() (linear_fc2): RowParallelLinear() ) (mlp_bda): IdentityFuncOp() ) ) ) ) (vision_projection): MultimodalProjector( (encoder): MLP( (linear_fc1): ColumnParallelLinear() (linear_fc2): RowParallelLinear() ) ) (pre_proj_layernorm): LayerNorm((4096,), eps=1e-05, elementwise_affine=True) ) (embedding): LanguageModelEmbedding( (word_embeddings): VocabParallelEmbedding() (embedding_dropout): Dropout(p=0.0, inplace=False) ) (rotary_pos_emb): RotaryEmbedding() (decoder): TransformerBlock( (layers): ModuleList( (0-47): 48 x TransformerLayer( (input_layernorm): RMSNorm() (self_attention): SelfAttention( (core_attention): DotProductAttention( (scale_mask_softmax): FusedScaleMaskSoftmax() (attention_dropout): Dropout(p=0.0, inplace=False) ) (linear_proj): RowParallelLinear() (linear_qkv): ColumnParallelLinear() (q_layernorm): IdentityOp() (k_layernorm): IdentityOp() ) (pre_cross_attn_layernorm): IdentityOp() (cross_attention): IdentityOp() (cross_attn_bda): IdentityFuncOp() (pre_mlp_layernorm): RMSNorm() (mlp): MLP( (linear_fc1): ColumnParallelLinear() (linear_fc2): RowParallelLinear() ) ) ) (final_layernorm): RMSNorm() ) (output_layer): ColumnParallelLinear() ) model GPTVLModel( (external_feature_model): MegatronVisionModel( (vit): InternViTModel( (conv1): Conv2d(3, 1024, kernel_size=(14, 14), stride=(14, 14)) (position_embeddings): Embedding(1025, 1024) (decoder): TransformerBlock( (layers): ModuleList( (0-23): 24 x InternViTTransformerLayer( (input_layernorm): LayerNorm((1024,), eps=1e-06, elementwise_affine=True) (self_attention): SelfAttention( (core_attention): DotProductAttention( (scale_mask_softmax): FusedScaleMaskSoftmax() (attention_dropout): Dropout(p=0.0, inplace=False) ) (linear_proj): RowParallelLinear() (linear_qkv): ColumnParallelLinear() ) (self_attn_bda): IdentityFuncOp() (pre_cross_attn_layernorm): IdentityOp() (cross_attention): IdentityOp() (cross_attn_bda): IdentityFuncOp() (pre_mlp_layernorm): LayerNorm((1024,), eps=1e-06, elementwise_affine=True) (mlp): MLP( (linear_fc1): ColumnParallelLinear() (linear_fc2): RowParallelLinear() ) (mlp_bda): IdentityFuncOp() ) ) ) ) (vision_projection): MultimodalProjector( (encoder): MLP( (linear_fc1): ColumnParallelLinear() (linear_fc2): RowParallelLinear() ) ) (pre_proj_layernorm): LayerNorm((4096,), eps=1e-05, elementwise_affine=True) ) (embedding): LanguageModelEmbedding( (word_embeddings): VocabParallelEmbedding() (embedding_dropout): Dropout(p=0.0, inplace=False) ) (rotary_pos_emb): RotaryEmbedding() (decoder): TransformerBlock( (layers): ModuleList( (0-47): 48 x TransformerLayer( (input_layernorm): RMSNorm() (self_attention): SelfAttention( (core_attention): DotProductAttention( (scale_mask_softmax): FusedScaleMaskSoftmax() (attention_dropout): Dropout(p=0.0, inplace=False) ) (linear_proj): RowParallelLinear() (linear_qkv): ColumnParallelLinear() (q_layernorm): IdentityOp() (k_layernorm): IdentityOp() ) (pre_cross_attn_layernorm): IdentityOp() (cross_attention): IdentityOp() (cross_attn_bda): IdentityFuncOp() (pre_mlp_layernorm): RMSNorm() (mlp): MLP( (linear_fc1): ColumnParallelLinear() (linear_fc2): RowParallelLinear() ) ) ) (final_layernorm): RMSNorm() ) (output_layer): ColumnParallelLinear() ) model GPTVLModel( (external_feature_model): MegatronVisionModel( (vit): InternViTModel( (conv1): Conv2d(3, 1024, kernel_size=(14, 14), stride=(14, 14)) (position_embeddings): Embedding(1025, 1024) (decoder): TransformerBlock( (layers): ModuleList( (0-23): 24 x InternViTTransformerLayer( (input_layernorm): LayerNorm((1024,), eps=1e-06, elementwise_affine=True) (self_attention): SelfAttention( (core_attention): DotProductAttention( (scale_mask_softmax): FusedScaleMaskSoftmax() (attention_dropout): Dropout(p=0.0, inplace=False) ) (linear_proj): RowParallelLinear() (linear_qkv): ColumnParallelLinear() ) (self_attn_bda): IdentityFuncOp() (pre_cross_attn_layernorm): IdentityOp() (cross_attention): IdentityOp() (cross_attn_bda): IdentityFuncOp() (pre_mlp_layernorm): LayerNorm((1024,), eps=1e-06, elementwise_affine=True) (mlp): MLP( (linear_fc1): ColumnParallelLinear() (linear_fc2): RowParallelLinear() ) (mlp_bda): IdentityFuncOp() ) ) ) ) (vision_projection): MultimodalProjector( (encoder): MLP( (linear_fc1): ColumnParallelLinear() (linear_fc2): RowParallelLinear() ) ) (pre_proj_layernorm): LayerNorm((4096,), eps=1e-05, elementwise_affine=True) ) (embedding): LanguageModelEmbedding( (word_embeddings): VocabParallelEmbedding() (embedding_dropout): Dropout(p=0.0, inplace=False) ) (rotary_pos_emb): RotaryEmbedding() (decoder): TransformerBlock( (layers): ModuleList( (0-47): 48 x TransformerLayer( (input_layernorm): RMSNorm() (self_attention): SelfAttention( (core_attention): DotProductAttention( (scale_mask_softmax): FusedScaleMaskSoftmax() (attention_dropout): Dropout(p=0.0, inplace=False) ) (linear_proj): RowParallelLinear() (linear_qkv): ColumnParallelLinear() (q_layernorm): IdentityOp() (k_layernorm): IdentityOp() ) (pre_cross_attn_layernorm): IdentityOp() (cross_attention): IdentityOp() (cross_attn_bda): IdentityFuncOp() (pre_mlp_layernorm): RMSNorm() (mlp): MLP( (linear_fc1): ColumnParallelLinear() (linear_fc2): RowParallelLinear() ) ) ) (final_layernorm): RMSNorm() ) (output_layer): ColumnParallelLinear() ) model GPTVLModel( (external_feature_model): MegatronVisionModel( (vit): InternViTModel( (conv1): Conv2d(3, 1024, kernel_size=(14, 14), stride=(14, 14)) (position_embeddings): Embedding(1025, 1024) (decoder): TransformerBlock( (layers): ModuleList( (0-23): 24 x InternViTTransformerLayer( (input_layernorm): LayerNorm((1024,), eps=1e-06, elementwise_affine=True) (self_attention): SelfAttention( (core_attention): DotProductAttention( (scale_mask_softmax): FusedScaleMaskSoftmax() (attention_dropout): Dropout(p=0.0, inplace=False) ) (linear_proj): RowParallelLinear() (linear_qkv): ColumnParallelLinear() ) (self_attn_bda): IdentityFuncOp() (pre_cross_attn_layernorm): IdentityOp() (cross_attention): IdentityOp() (cross_attn_bda): IdentityFuncOp() (pre_mlp_layernorm): LayerNorm((1024,), eps=1e-06, elementwise_affine=True) (mlp): MLP( (linear_fc1): ColumnParallelLinear() (linear_fc2): RowParallelLinear() ) (mlp_bda): IdentityFuncOp() ) ) ) ) (vision_projection): MultimodalProjector( (encoder): MLP( (linear_fc1): ColumnParallelLinear() (linear_fc2): RowParallelLinear() ) ) (pre_proj_layernorm): LayerNorm((4096,), eps=1e-05, elementwise_affine=True) ) (embedding): LanguageModelEmbedding( (word_embeddings): VocabParallelEmbedding() (embedding_dropout): Dropout(p=0.0, inplace=False) ) (rotary_pos_emb): RotaryEmbedding() (decoder): TransformerBlock( (layers): ModuleList( (0-47): 48 x TransformerLayer( (input_layernorm): RMSNorm() (self_attention): SelfAttention( (core_attention): DotProductAttention( (scale_mask_softmax): FusedScaleMaskSoftmax() (attention_dropout): Dropout(p=0.0, inplace=False) ) (linear_proj): RowParallelLinear() (linear_qkv): ColumnParallelLinear() (q_layernorm): IdentityOp() (k_layernorm): IdentityOp() ) (pre_cross_attn_layernorm): IdentityOp() (cross_attention): IdentityOp() (cross_attn_bda): IdentityFuncOp() (pre_mlp_layernorm): RMSNorm() (mlp): MLP( (linear_fc1): ColumnParallelLinear() (linear_fc2): RowParallelLinear() ) ) ) (final_layernorm): RMSNorm() ) (output_layer): ColumnParallelLinear() ) model GPTVLModel( (external_feature_model): MegatronVisionModel( (vit): InternViTModel( (conv1): Conv2d(3, 1024, kernel_size=(14, 14), stride=(14, 14)) (position_embeddings): Embedding(1025, 1024) (decoder): TransformerBlock( (layers): ModuleList( (0-23): 24 x InternViTTransformerLayer( (input_layernorm): LayerNorm((1024,), eps=1e-06, elementwise_affine=True) (self_attention): SelfAttention( (core_attention): DotProductAttention( (scale_mask_softmax): FusedScaleMaskSoftmax() (attention_dropout): Dropout(p=0.0, inplace=False) ) (linear_proj): RowParallelLinear() (linear_qkv): ColumnParallelLinear() ) (self_attn_bda): IdentityFuncOp() (pre_cross_attn_layernorm): IdentityOp() (cross_attention): IdentityOp() (cross_attn_bda): IdentityFuncOp() (pre_mlp_layernorm): LayerNorm((1024,), eps=1e-06, elementwise_affine=True) (mlp): MLP( (linear_fc1): ColumnParallelLinear() (linear_fc2): RowParallelLinear() ) (mlp_bda): IdentityFuncOp() ) ) ) ) (vision_projection): MultimodalProjector( (encoder): MLP( (linear_fc1): ColumnParallelLinear() (linear_fc2): RowParallelLinear() ) ) (pre_proj_layernorm): LayerNorm((4096,), eps=1e-05, elementwise_affine=True) ) (embedding): LanguageModelEmbedding( (word_embeddings): VocabParallelEmbedding() (embedding_dropout): Dropout(p=0.0, inplace=False) ) (rotary_pos_emb): RotaryEmbedding() (decoder): TransformerBlock( (layers): ModuleList( (0-47): 48 x TransformerLayer( (input_layernorm): RMSNorm() (self_attention): SelfAttention( (core_attention): DotProductAttention( (scale_mask_softmax): FusedScaleMaskSoftmax() (attention_dropout): Dropout(p=0.0, inplace=False) ) (linear_proj): RowParallelLinear() (linear_qkv): ColumnParallelLinear() (q_layernorm): IdentityOp() (k_layernorm): IdentityOp() ) (pre_cross_attn_layernorm): IdentityOp() (cross_attention): IdentityOp() (cross_attn_bda): IdentityFuncOp() (pre_mlp_layernorm): RMSNorm() (mlp): MLP( (linear_fc1): ColumnParallelLinear() (linear_fc2): RowParallelLinear() ) ) ) (final_layernorm): RMSNorm() ) (output_layer): ColumnParallelLinear() ) model GPTVLModel( (external_feature_model): MegatronVisionModel( (vit): InternViTModel( (conv1): Conv2d(3, 1024, kernel_size=(14, 14), stride=(14, 14)) (position_embeddings): Embedding(1025, 1024) (decoder): TransformerBlock( (layers): ModuleList( (0-23): 24 x InternViTTransformerLayer( (input_layernorm): LayerNorm((1024,), eps=1e-06, elementwise_affine=True) (self_attention): SelfAttention( (core_attention): DotProductAttention( (scale_mask_softmax): FusedScaleMaskSoftmax() (attention_dropout): Dropout(p=0.0, inplace=False) ) (linear_proj): RowParallelLinear() (linear_qkv): ColumnParallelLinear() ) (self_attn_bda): IdentityFuncOp() (pre_cross_attn_layernorm): IdentityOp() (cross_attention): IdentityOp() (cross_attn_bda): IdentityFuncOp() (pre_mlp_layernorm): LayerNorm((1024,), eps=1e-06, elementwise_affine=True) (mlp): MLP( (linear_fc1): ColumnParallelLinear() (linear_fc2): RowParallelLinear() ) (mlp_bda): IdentityFuncOp() ) ) ) ) (vision_projection): MultimodalProjector( (encoder): MLP( (linear_fc1): ColumnParallelLinear() (linear_fc2): RowParallelLinear() ) ) (pre_proj_layernorm): LayerNorm((4096,), eps=1e-05, elementwise_affine=True) ) (embedding): LanguageModelEmbedding( (word_embeddings): VocabParallelEmbedding() (embedding_dropout): Dropout(p=0.0, inplace=False) ) (rotary_pos_emb): RotaryEmbedding() (decoder): TransformerBlock( (layers): ModuleList( (0-47): 48 x TransformerLayer( (input_layernorm): RMSNorm() (self_attention): SelfAttention( (core_attention): DotProductAttention( (scale_mask_softmax): FusedScaleMaskSoftmax() (attention_dropout): Dropout(p=0.0, inplace=False) ) (linear_proj): RowParallelLinear() (linear_qkv): ColumnParallelLinear() (q_layernorm): IdentityOp() (k_layernorm): IdentityOp() ) (pre_cross_attn_layernorm): IdentityOp() (cross_attention): IdentityOp() (cross_attn_bda): IdentityFuncOp() (pre_mlp_layernorm): RMSNorm() (mlp): MLP( (linear_fc1): ColumnParallelLinear() (linear_fc2): RowParallelLinear() ) ) ) (final_layernorm): RMSNorm() ) (output_layer): ColumnParallelLinear() ) model GPTVLModel( (external_feature_model): MegatronVisionModel( (vit): InternViTModel( (conv1): Conv2d(3, 1024, kernel_size=(14, 14), stride=(14, 14)) (position_embeddings): Embedding(1025, 1024) (decoder): TransformerBlock( (layers): ModuleList( (0-23): 24 x InternViTTransformerLayer( (input_layernorm): LayerNorm((1024,), eps=1e-06, elementwise_affine=True) (self_attention): SelfAttention( (core_attention): DotProductAttention( (scale_mask_softmax): FusedScaleMaskSoftmax() (attention_dropout): Dropout(p=0.0, inplace=False) ) (linear_proj): RowParallelLinear() (linear_qkv): ColumnParallelLinear() ) (self_attn_bda): IdentityFuncOp() (pre_cross_attn_layernorm): IdentityOp() (cross_attention): IdentityOp() (cross_attn_bda): IdentityFuncOp() (pre_mlp_layernorm): LayerNorm((1024,), eps=1e-06, elementwise_affine=True) (mlp): MLP( (linear_fc1): ColumnParallelLinear() (linear_fc2): RowParallelLinear() ) (mlp_bda): IdentityFuncOp() ) ) ) ) (vision_projection): MultimodalProjector( (encoder): MLP( (linear_fc1): ColumnParallelLinear() (linear_fc2): RowParallelLinear() ) ) (pre_proj_layernorm): LayerNorm((4096,), eps=1e-05, elementwise_affine=True) ) (embedding): LanguageModelEmbedding( (word_embeddings): VocabParallelEmbedding() (embedding_dropout): Dropout(p=0.0, inplace=False) ) (rotary_pos_emb): RotaryEmbedding() (decoder): TransformerBlock( (layers): ModuleList( (0-47): 48 x TransformerLayer( (input_layernorm): RMSNorm() (self_attention): SelfAttention( (core_attention): DotProductAttention( (scale_mask_softmax): FusedScaleMaskSoftmax() (attention_dropout): Dropout(p=0.0, inplace=False) ) (linear_proj): RowParallelLinear() (linear_qkv): ColumnParallelLinear() (q_layernorm): IdentityOp() (k_layernorm): IdentityOp() ) (pre_cross_attn_layernorm): IdentityOp() (cross_attention): IdentityOp() (cross_attn_bda): IdentityFuncOp() (pre_mlp_layernorm): RMSNorm() (mlp): MLP( (linear_fc1): ColumnParallelLinear() (linear_fc2): RowParallelLinear() ) ) ) (final_layernorm): RMSNorm() ) (output_layer): ColumnParallelLinear() ) model GPTVLModel( (external_feature_model): MegatronVisionModel( (vit): InternViTModel( (conv1): Conv2d(3, 1024, kernel_size=(14, 14), stride=(14, 14)) (position_embeddings): Embedding(1025, 1024) (decoder): TransformerBlock( (layers): ModuleList( (0-23): 24 x InternViTTransformerLayer( (input_layernorm): LayerNorm((1024,), eps=1e-06, elementwise_affine=True) (self_attention): SelfAttention( (core_attention): DotProductAttention( (scale_mask_softmax): FusedScaleMaskSoftmax() (attention_dropout): Dropout(p=0.0, inplace=False) ) (linear_proj): RowParallelLinear() (linear_qkv): ColumnParallelLinear() ) (self_attn_bda): IdentityFuncOp() (pre_cross_attn_layernorm): IdentityOp() (cross_attention): IdentityOp() (cross_attn_bda): IdentityFuncOp() (pre_mlp_layernorm): LayerNorm((1024,), eps=1e-06, elementwise_affine=True) (mlp): MLP( (linear_fc1): ColumnParallelLinear() (linear_fc2): RowParallelLinear() ) (mlp_bda): IdentityFuncOp() ) ) ) ) (vision_projection): MultimodalProjector( (encoder): MLP( (linear_fc1): ColumnParallelLinear() (linear_fc2): RowParallelLinear() ) ) (pre_proj_layernorm): LayerNorm((4096,), eps=1e-05, elementwise_affine=True) ) (embedding): LanguageModelEmbedding( (word_embeddings): VocabParallelEmbedding() (embedding_dropout): Dropout(p=0.0, inplace=False) ) (rotary_pos_emb): RotaryEmbedding() (decoder): TransformerBlock( (layers): ModuleList( (0-47): 48 x TransformerLayer( (input_layernorm): RMSNorm() (self_attention): SelfAttention( (core_attention): DotProductAttention( (scale_mask_softmax): FusedScaleMaskSoftmax() (attention_dropout): Dropout(p=0.0, inplace=False) ) (linear_proj): RowParallelLinear() (linear_qkv): ColumnParallelLinear() (q_layernorm): IdentityOp() (k_layernorm): IdentityOp() ) (pre_cross_attn_layernorm): IdentityOp() (cross_attention): IdentityOp() (cross_attn_bda): IdentityFuncOp() (pre_mlp_layernorm): RMSNorm() (mlp): MLP( (linear_fc1): ColumnParallelLinear() (linear_fc2): RowParallelLinear() ) ) ) (final_layernorm): RMSNorm() ) (output_layer): ColumnParallelLinear() ) model GPTVLModel( (external_feature_model): MegatronVisionModel( (vit): InternViTModel( (conv1): Conv2d(3, 1024, kernel_size=(14, 14), stride=(14, 14)) (position_embeddings): Embedding(1025, 1024) (decoder): TransformerBlock( (layers): ModuleList( (0-23): 24 x InternViTTransformerLayer( (input_layernorm): LayerNorm((1024,), eps=1e-06, elementwise_affine=True) (self_attention): SelfAttention( (core_attention): DotProductAttention( (scale_mask_softmax): FusedScaleMaskSoftmax() (attention_dropout): Dropout(p=0.0, inplace=False) ) (linear_proj): RowParallelLinear() (linear_qkv): ColumnParallelLinear() ) (self_attn_bda): IdentityFuncOp() (pre_cross_attn_layernorm): IdentityOp() (cross_attention): IdentityOp() (cross_attn_bda): IdentityFuncOp() (pre_mlp_layernorm): LayerNorm((1024,), eps=1e-06, elementwise_affine=True) (mlp): MLP( (linear_fc1): ColumnParallelLinear() (linear_fc2): RowParallelLinear() ) (mlp_bda): IdentityFuncOp() ) ) ) ) (vision_projection): MultimodalProjector( (encoder): MLP( (linear_fc1): ColumnParallelLinear() (linear_fc2): RowParallelLinear() ) ) (pre_proj_layernorm): LayerNorm((4096,), eps=1e-05, elementwise_affine=True) ) (embedding): LanguageModelEmbedding( (word_embeddings): VocabParallelEmbedding() (embedding_dropout): Dropout(p=0.0, inplace=False) ) (rotary_pos_emb): RotaryEmbedding() (decoder): TransformerBlock( (layers): ModuleList( (0-47): 48 x TransformerLayer( (input_layernorm): RMSNorm() (self_attention): SelfAttention( (core_attention): DotProductAttention( (scale_mask_softmax): FusedScaleMaskSoftmax() (attention_dropout): Dropout(p=0.0, inplace=False) ) (linear_proj): RowParallelLinear() (linear_qkv): ColumnParallelLinear() (q_layernorm): IdentityOp() (k_layernorm): IdentityOp() ) (pre_cross_attn_layernorm): IdentityOp() (cross_attention): IdentityOp() (cross_attn_bda): IdentityFuncOp() (pre_mlp_layernorm): RMSNorm() (mlp): MLP( (linear_fc1): ColumnParallelLinear() (linear_fc2): RowParallelLinear() ) ) ) (final_layernorm): RMSNorm() ) (output_layer): ColumnParallelLinear() ) model GPTVLModel( (external_feature_model): MegatronVisionModel( (vit): InternViTModel( (conv1): Conv2d(3, 1024, kernel_size=(14, 14), stride=(14, 14)) (position_embeddings): Embedding(1025, 1024) (decoder): TransformerBlock( (layers): ModuleList( (0-23): 24 x InternViTTransformerLayer( (input_layernorm): LayerNorm((1024,), eps=1e-06, elementwise_affine=True) (self_attention): SelfAttention( (core_attention): DotProductAttention( (scale_mask_softmax): FusedScaleMaskSoftmax() (attention_dropout): Dropout(p=0.0, inplace=False) ) (linear_proj): RowParallelLinear() (linear_qkv): ColumnParallelLinear() ) (self_attn_bda): IdentityFuncOp() (pre_cross_attn_layernorm): IdentityOp() (cross_attention): IdentityOp() (cross_attn_bda): IdentityFuncOp() (pre_mlp_layernorm): LayerNorm((1024,), eps=1e-06, elementwise_affine=True) (mlp): MLP( (linear_fc1): ColumnParallelLinear() (linear_fc2): RowParallelLinear() ) (mlp_bda): IdentityFuncOp() ) ) ) ) (vision_projection): MultimodalProjector( (encoder): MLP( (linear_fc1): ColumnParallelLinear() (linear_fc2): RowParallelLinear() ) ) (pre_proj_layernorm): LayerNorm((4096,), eps=1e-05, elementwise_affine=True) ) (embedding): LanguageModelEmbedding( (word_embeddings): VocabParallelEmbedding() (embedding_dropout): Dropout(p=0.0, inplace=False) ) (rotary_pos_emb): RotaryEmbedding() (decoder): TransformerBlock( (layers): ModuleList( (0-47): 48 x TransformerLayer( (input_layernorm): RMSNorm() (self_attention): SelfAttention( (core_attention): DotProductAttention( (scale_mask_softmax): FusedScaleMaskSoftmax() (attention_dropout): Dropout(p=0.0, inplace=False) ) (linear_proj): RowParallelLinear() (linear_qkv): ColumnParallelLinear() (q_layernorm): IdentityOp() (k_layernorm): IdentityOp() ) (pre_cross_attn_layernorm): IdentityOp() (cross_attention): IdentityOp() (cross_attn_bda): IdentityFuncOp() (pre_mlp_layernorm): RMSNorm() (mlp): MLP( (linear_fc1): ColumnParallelLinear() (linear_fc2): RowParallelLinear() ) ) ) (final_layernorm): RMSNorm() ) (output_layer): ColumnParallelLinear() ) model GPTVLModel( (external_feature_model): MegatronVisionModel( (vit): InternViTModel( (conv1): Conv2d(3, 1024, kernel_size=(14, 14), stride=(14, 14)) (position_embeddings): Embedding(1025, 1024) (decoder): TransformerBlock( (layers): ModuleList( (0-23): 24 x InternViTTransformerLayer( (input_layernorm): LayerNorm((1024,), eps=1e-06, elementwise_affine=True) (self_attention): SelfAttention( (core_attention): DotProductAttention( (scale_mask_softmax): FusedScaleMaskSoftmax() (attention_dropout): Dropout(p=0.0, inplace=False) ) (linear_proj): RowParallelLinear() (linear_qkv): ColumnParallelLinear() ) (self_attn_bda): IdentityFuncOp() (pre_cross_attn_layernorm): IdentityOp() (cross_attention): IdentityOp() (cross_attn_bda): IdentityFuncOp() (pre_mlp_layernorm): LayerNorm((1024,), eps=1e-06, elementwise_affine=True) (mlp): MLP( (linear_fc1): ColumnParallelLinear() (linear_fc2): RowParallelLinear() ) (mlp_bda): IdentityFuncOp() ) ) ) ) (vision_projection): MultimodalProjector( (encoder): MLP( (linear_fc1): ColumnParallelLinear() (linear_fc2): RowParallelLinear() ) ) (pre_proj_layernorm): LayerNorm((4096,), eps=1e-05, elementwise_affine=True) ) (embedding): LanguageModelEmbedding( (word_embeddings): VocabParallelEmbedding() (embedding_dropout): Dropout(p=0.0, inplace=False) ) (rotary_pos_emb): RotaryEmbedding() (decoder): TransformerBlock( (layers): ModuleList( (0-47): 48 x TransformerLayer( (input_layernorm): RMSNorm() (self_attention): SelfAttention( (core_attention): DotProductAttention( (scale_mask_softmax): FusedScaleMaskSoftmax() (attention_dropout): Dropout(p=0.0, inplace=False) ) (linear_proj): RowParallelLinear() (linear_qkv): ColumnParallelLinear() (q_layernorm): IdentityOp() (k_layernorm): IdentityOp() ) (pre_cross_attn_layernorm): IdentityOp() (cross_attention): IdentityOp() (cross_attn_bda): IdentityFuncOp() (pre_mlp_layernorm): RMSNorm() (mlp): MLP( (linear_fc1): ColumnParallelLinear() (linear_fc2): RowParallelLinear() ) ) ) (final_layernorm): RMSNorm() ) (output_layer): ColumnParallelLinear() ) model GPTVLModel( (external_feature_model): MegatronVisionModel( (vit): InternViTModel( (conv1): Conv2d(3, 1024, kernel_size=(14, 14), stride=(14, 14)) (position_embeddings): Embedding(1025, 1024) (decoder): TransformerBlock( (layers): ModuleList( (0-23): 24 x InternViTTransformerLayer( (input_layernorm): LayerNorm((1024,), eps=1e-06, elementwise_affine=True) (self_attention): SelfAttention( (core_attention): DotProductAttention( (scale_mask_softmax): FusedScaleMaskSoftmax() (attention_dropout): Dropout(p=0.0, inplace=False) ) (linear_proj): RowParallelLinear() (linear_qkv): ColumnParallelLinear() ) (self_attn_bda): IdentityFuncOp() (pre_cross_attn_layernorm): IdentityOp() (cross_attention): IdentityOp() (cross_attn_bda): IdentityFuncOp() (pre_mlp_layernorm): LayerNorm((1024,), eps=1e-06, elementwise_affine=True) (mlp): MLP( (linear_fc1): ColumnParallelLinear() (linear_fc2): RowParallelLinear() ) (mlp_bda): IdentityFuncOp() ) ) ) ) (vision_projection): MultimodalProjector( (encoder): MLP( (linear_fc1): ColumnParallelLinear() (linear_fc2): RowParallelLinear() ) ) (pre_proj_layernorm): LayerNorm((4096,), eps=1e-05, elementwise_affine=True) ) (embedding): LanguageModelEmbedding( (word_embeddings): VocabParallelEmbedding() (embedding_dropout): Dropout(p=0.0, inplace=False) ) (rotary_pos_emb): RotaryEmbedding() (decoder): TransformerBlock( (layers): ModuleList( (0-47): 48 x TransformerLayer( (input_layernorm): RMSNorm() (self_attention): SelfAttention( (core_attention): DotProductAttention( (scale_mask_softmax): FusedScaleMaskSoftmax() (attention_dropout): Dropout(p=0.0, inplace=False) ) (linear_proj): RowParallelLinear() (linear_qkv): ColumnParallelLinear() (q_layernorm): IdentityOp() (k_layernorm): IdentityOp() ) (pre_cross_attn_layernorm): IdentityOp() (cross_attention): IdentityOp() (cross_attn_bda): IdentityFuncOp() (pre_mlp_layernorm): RMSNorm() (mlp): MLP( (linear_fc1): ColumnParallelLinear() (linear_fc2): RowParallelLinear() ) ) ) (final_layernorm): RMSNorm() ) (output_layer): ColumnParallelLinear() ) model GPTVLModel( (external_feature_model): MegatronVisionModel( (vit): InternViTModel( (conv1): Conv2d(3, 1024, kernel_size=(14, 14), stride=(14, 14)) (position_embeddings): Embedding(1025, 1024) (decoder): TransformerBlock( (layers): ModuleList( (0-23): 24 x InternViTTransformerLayer( (input_layernorm): LayerNorm((1024,), eps=1e-06, elementwise_affine=True) (self_attention): SelfAttention( (core_attention): DotProductAttention( (scale_mask_softmax): FusedScaleMaskSoftmax() (attention_dropout): Dropout(p=0.0, inplace=False) ) (linear_proj): RowParallelLinear() (linear_qkv): ColumnParallelLinear() ) (self_attn_bda): IdentityFuncOp() (pre_cross_attn_layernorm): IdentityOp() (cross_attention): IdentityOp() (cross_attn_bda): IdentityFuncOp() (pre_mlp_layernorm): LayerNorm((1024,), eps=1e-06, elementwise_affine=True) (mlp): MLP( (linear_fc1): ColumnParallelLinear() (linear_fc2): RowParallelLinear() ) (mlp_bda): IdentityFuncOp() ) ) ) ) (vision_projection): MultimodalProjector( (encoder): MLP( (linear_fc1): ColumnParallelLinear() (linear_fc2): RowParallelLinear() ) ) (pre_proj_layernorm): LayerNorm((4096,), eps=1e-05, elementwise_affine=True) ) (embedding): LanguageModelEmbedding( (word_embeddings): VocabParallelEmbedding() (embedding_dropout): Dropout(p=0.0, inplace=False) ) (rotary_pos_emb): RotaryEmbedding() (decoder): TransformerBlock( (layers): ModuleList( (0-47): 48 x TransformerLayer( (input_layernorm): RMSNorm() (self_attention): SelfAttention( (core_attention): DotProductAttention( (scale_mask_softmax): FusedScaleMaskSoftmax() (attention_dropout): Dropout(p=0.0, inplace=False) ) (linear_proj): RowParallelLinear() (linear_qkv): ColumnParallelLinear() (q_layernorm): IdentityOp() (k_layernorm): IdentityOp() ) (pre_cross_attn_layernorm): IdentityOp() (cross_attention): IdentityOp() (cross_attn_bda): IdentityFuncOp() (pre_mlp_layernorm): RMSNorm() (mlp): MLP( (linear_fc1): ColumnParallelLinear() (linear_fc2): RowParallelLinear() ) ) ) (final_layernorm): RMSNorm() ) (output_layer): ColumnParallelLinear() ) name module.module.external_feature_model.vit.class_token lr_decay_rate 1.0 _get_param_groups name module.module.external_feature_model.vit.class_token key (1.0, 0.1, False, False) name module.module.external_feature_model.vit.conv1.weight lr_decay_rate 0.0717897987691853 _get_param_groups name module.module.external_feature_model.vit.conv1.weight key (1.0, 0.00717897987691853, False, False) name module.module.external_feature_model.vit.conv1.bias lr_decay_rate 0.0717897987691853 _get_param_groups name module.module.external_feature_model.vit.conv1.bias key (0.0, 0.00717897987691853, False, False) name module.module.external_feature_model.vit.position_embeddings.weight lr_decay_rate 0.0717897987691853 _get_param_groups name module.module.external_feature_model.vit.position_embeddings.weight key (1.0, 0.00717897987691853, False, False) name module.module.external_feature_model.vit.decoder.layers.0.ls1 lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.ls1 key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.0.ls2 lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.ls2 key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.weight lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.weight key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.bias lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.bias key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.weight lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.weight key (1.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.bias lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.bias key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.weight lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.weight key (1.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.bias lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.bias key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.weight lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.weight key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.bias lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.bias key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.weight lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.weight key (1.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.bias lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.bias key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.weight lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.weight key (1.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.bias lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.bias key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.1.ls1 lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.ls1 key (0.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.1.ls2 lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.ls2 key (0.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.weight lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.weight key (0.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.bias lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.bias key (0.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.weight lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.weight key (1.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.bias lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.bias key (0.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.weight lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.weight key (1.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.bias lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.bias key (0.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.weight lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.weight key (0.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.bias lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.bias key (0.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.weight lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.weight key (1.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.bias lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.bias key (0.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.weight lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.weight key (1.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.bias lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.bias key (0.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.2.ls1 lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.ls1 key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.2.ls2 lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.ls2 key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.weight lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.weight key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.bias lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.bias key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.weight lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.weight key (1.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.bias lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.bias key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.weight lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.weight key (1.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.bias lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.bias key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.weight lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.weight key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.bias lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.class_token lr_decay_rate 1.0_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.bias key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.weight lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.weight key (1.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.bias lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.bias key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.weight lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.class_token lr_decay_rate 1.0_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.weight key (1.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.bias lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.bias key (0.0, 0.00984770902183612, False, False) _get_param_groups name module.module.external_feature_model.vit.class_token key (1.0, 0.1, False, False) name module.module.external_feature_model.vit.decoder.layers.3.ls1 lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.ls1 key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.conv1.weight lr_decay_rate 0.0717897987691853 name module.module.external_feature_model.vit.decoder.layers.3.ls2 lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.ls2 key (0.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.conv1.weight key (1.0, 0.00717897987691853, False, False) name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.weight lr_decay_rate 0.10941898913151242 name module.module.external_feature_model.vit.conv1.bias lr_decay_rate 0.0717897987691853 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.weight key (0.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.conv1.bias key (0.0, 0.00717897987691853, False, False) name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.bias lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.bias key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.position_embeddings.weight lr_decay_rate 0.0717897987691853 _get_param_groups name module.module.external_feature_model.vit.class_token key (1.0, 0.1, False, False) _get_param_groups name module.module.external_feature_model.vit.position_embeddings.weight key (1.0, 0.00717897987691853, False, False) name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.weight lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.weight key (1.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.class_token lr_decay_rate 1.0 name module.module.external_feature_model.vit.conv1.weight lr_decay_rate 0.0717897987691853 name module.module.external_feature_model.vit.decoder.layers.0.ls1 lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.bias lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.ls1 key (0.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.conv1.weight key (1.0, 0.00717897987691853, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.bias key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.0.ls2 lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.conv1.bias lr_decay_rate 0.0717897987691853 name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.weight lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.ls2 key (0.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.conv1.bias key (0.0, 0.00717897987691853, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.weight key (1.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.weight lr_decay_rate 0.07976644307687256name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.bias lr_decay_rate 0.10941898913151242 name module.module.external_feature_model.vit.position_embeddings.weight lr_decay_rate 0.0717897987691853 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.bias key (0.0, 0.010941898913151242, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.weight key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.class_token lr_decay_rate 1.0_get_param_groups name module.module.external_feature_model.vit.position_embeddings.weight key (1.0, 0.00717897987691853, False, False) name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.bias lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.weight lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.bias key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.0.ls1 lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.weight key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.bias lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.ls1 key (0.0, 0.007976644307687256, False, False)name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.weight lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.class_token key (1.0, 0.1, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.bias key (0.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.weight key (1.0, 0.007976644307687256, False, False)name module.module.external_feature_model.vit.decoder.layers.0.ls2 lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.weight lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.ls2 key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.bias lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.weight key (1.0, 0.010941898913151242, False, False)name module.module.external_feature_model.vit.conv1.weight lr_decay_rate 0.0717897987691853 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.bias key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.weight lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.bias lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.conv1.weight key (1.0, 0.00717897987691853, False, False)name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.weight lr_decay_rate 0.07976644307687256_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.weight key (0.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.bias key (0.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.class_token key (1.0, 0.1, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.weight key (1.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.bias lr_decay_rate 0.07976644307687256name module.module.external_feature_model.vit.conv1.bias lr_decay_rate 0.0717897987691853 name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.weight lr_decay_rate 0.10941898913151242 name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.bias lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.bias key (0.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.conv1.bias key (0.0, 0.00717897987691853, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.weight key (1.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.bias key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.conv1.weight lr_decay_rate 0.0717897987691853 name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.bias lr_decay_rate 0.10941898913151242 name module.module.external_feature_model.vit.position_embeddings.weight lr_decay_rate 0.0717897987691853 name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.weight lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.bias key (0.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.conv1.weight key (1.0, 0.00717897987691853, False, False)name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.weight lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.position_embeddings.weight key (1.0, 0.00717897987691853, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.weight key (1.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.weight key (0.0, 0.007976644307687256, False, False)name module.module.external_feature_model.vit.decoder.layers.4.ls1 lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.conv1.bias lr_decay_rate 0.0717897987691853 name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.bias lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.0.ls1 lr_decay_rate 0.07976644307687256_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.ls1 key (0.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.bias lr_decay_rate 0.07976644307687256_get_param_groups name module.module.external_feature_model.vit.conv1.bias key (0.0, 0.00717897987691853, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.bias key (0.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.bias key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.4.ls2 lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.ls1 key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.weight lr_decay_rate 0.07976644307687256name module.module.external_feature_model.vit.position_embeddings.weight lr_decay_rate 0.0717897987691853 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.ls2 key (0.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.weight lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.position_embeddings.weight key (1.0, 0.00717897987691853, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.weight key (1.0, 0.007976644307687256, False, False)name module.module.external_feature_model.vit.decoder.layers.0.ls2 lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.weight key (1.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.weight lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.ls2 key (0.0, 0.007976644307687256, False, False)name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.bias lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.bias lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.weight key (0.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.bias key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.0.ls1 lr_decay_rate 0.07976644307687256_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.bias key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.weight lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.bias lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.class_token lr_decay_rate 1.0 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.weight key (0.0, 0.007976644307687256, False, False)name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.weight lr_decay_rate 0.07976644307687256_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.ls1 key (0.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.bias key (0.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.weight lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.weight key (0.0, 0.007976644307687256, False, False)name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.bias lr_decay_rate 0.07976644307687256_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.weight key (1.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.0.ls2 lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.weight lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.bias key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.bias lr_decay_rate 0.07976644307687256name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.bias lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.ls2 key (0.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.weight key (1.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.bias key (0.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.bias key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.weight lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.bias lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.weight lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.1.ls1 lr_decay_rate 0.08862938119652507_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.bias key (0.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.weight lr_decay_rate 0.07976644307687256_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.weight key (1.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.weight key (0.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.weight key (1.0, 0.007976644307687256, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.ls1 key (0.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.bias lr_decay_rate 0.07976644307687256name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.bias lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.weight lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.bias lr_decay_rate 0.07976644307687256name module.module.external_feature_model.vit.decoder.layers.1.ls2 lr_decay_rate 0.08862938119652507_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.bias key (0.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.bias key (0.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.weight key (1.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.ls2 key (0.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.bias key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.bias lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.external_feature_model.vit.class_token key (1.0, 0.1, False, False)name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.weight lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.weight lr_decay_rate 0.08862938119652507_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.bias key (0.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.weight lr_decay_rate 0.07976644307687256name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.weight lr_decay_rate 0.07976644307687256_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.weight key (1.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.weight key (1.0, 0.007976644307687256, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.weight key (0.0, 0.008862938119652507, False, False)name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.bias lr_decay_rate 0.07976644307687256_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.weight key (1.0, 0.007976644307687256, False, False)name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.weight lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.conv1.weight lr_decay_rate 0.0717897987691853 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.bias key (0.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.weight key (0.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.bias lr_decay_rate 0.07976644307687256name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.bias lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.bias lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.conv1.weight key (1.0, 0.00717897987691853, False, False) name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.bias lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.bias key (0.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.bias key (0.0, 0.007976644307687256, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.bias key (0.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.weight lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.conv1.bias lr_decay_rate 0.0717897987691853 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.bias key (0.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.weight key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.weight lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.conv1.bias key (0.0, 0.00717897987691853, False, False) name module.module.external_feature_model.vit.decoder.layers.1.ls1 lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.weight lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.weight lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.bias lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.weight key (1.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.ls1 key (0.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.weight key (1.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.weight key (1.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.position_embeddings.weight lr_decay_rate 0.0717897987691853_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.bias key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.bias lr_decay_rate 0.07976644307687256name module.module.external_feature_model.vit.decoder.layers.1.ls2 lr_decay_rate 0.08862938119652507name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.bias lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.bias lr_decay_rate 0.08862938119652507_get_param_groups name module.module.external_feature_model.vit.position_embeddings.weight key (1.0, 0.00717897987691853, False, False)name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.weight lr_decay_rate 0.07976644307687256name module.module.external_feature_model.vit.class_token lr_decay_rate 1.0 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.ls2 key (0.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.bias key (0.0, 0.012157665459056936, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.bias key (0.0, 0.007976644307687256, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.bias key (0.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.weight key (1.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.0.ls1 lr_decay_rate 0.07976644307687256name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.weight lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.class_token lr_decay_rate 1.0name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.weight lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.bias lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.weight lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.weight lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.weight key (0.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.ls1 key (0.0, 0.007976644307687256, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.bias key (0.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.weight key (1.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.weight key (1.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.weight key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.bias lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.bias lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.0.ls2 lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.weight lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.bias lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.bias key (0.0, 0.008862938119652507, False, False)name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.bias lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.bias key (0.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.ls2 key (0.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.bias key (0.0, 0.008862938119652507, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.weight key (1.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.bias key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.5.ls1 lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.weight lr_decay_rate 0.07976644307687256name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.weight lr_decay_rate 0.08862938119652507name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.bias lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.ls1 key (0.0, 0.013508517176729929, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.bias key (0.0, 0.007976644307687256, False, False)name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.weight lr_decay_rate 0.07976644307687256_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.weight key (0.0, 0.007976644307687256, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.weight key (1.0, 0.008862938119652507, False, False)name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.weight lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.class_token key (1.0, 0.1, False, False)name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.bias lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.weight key (1.0, 0.007976644307687256, False, False)name module.module.external_feature_model.vit.decoder.layers.5.ls2 lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.weight key (0.0, 0.008862938119652507, False, False)name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.bias lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.1.ls1 lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.bias key (0.0, 0.007976644307687256, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.ls2 key (0.0, 0.013508517176729929, False, False)name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.bias lr_decay_rate 0.07976644307687256_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.bias key (0.0, 0.008862938119652507, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.ls1 key (0.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.bias lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.conv1.weight lr_decay_rate 0.0717897987691853 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.bias key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.weight lr_decay_rate 0.08862938119652507_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.bias key (0.0, 0.008862938119652507, False, False)name module.module.external_feature_model.vit.decoder.layers.1.ls2 lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.weight lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.class_token key (1.0, 0.1, False, False) name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.weight lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.conv1.weight key (1.0, 0.00717897987691853, False, False) name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.weight lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.weight key (1.0, 0.008862938119652507, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.weight key (0.0, 0.013508517176729929, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.ls2 key (0.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.weight lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.weight key (1.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.weight key (1.0, 0.007976644307687256, False, False)name module.module.external_feature_model.vit.conv1.bias lr_decay_rate 0.0717897987691853 name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.bias lr_decay_rate 0.08862938119652507name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.bias lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.weight key (1.0, 0.008862938119652507, False, False)name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.weight lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.bias lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.conv1.weight lr_decay_rate 0.0717897987691853_get_param_groups name module.module.external_feature_model.vit.conv1.bias key (0.0, 0.00717897987691853, False, False)name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.bias lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.bias key (0.0, 0.008862938119652507, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.bias key (0.0, 0.013508517176729929, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.weight key (0.0, 0.008862938119652507, False, False)name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.bias lr_decay_rate 0.08862938119652507_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.bias key (0.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.bias key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.position_embeddings.weight lr_decay_rate 0.0717897987691853_get_param_groups name module.module.external_feature_model.vit.conv1.weight key (1.0, 0.00717897987691853, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.bias key (0.0, 0.008862938119652507, False, False)name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.bias lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.weight lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.weight lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.weight lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.position_embeddings.weight key (1.0, 0.00717897987691853, False, False)name module.module.external_feature_model.vit.decoder.layers.1.ls1 lr_decay_rate 0.08862938119652507_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.bias key (0.0, 0.008862938119652507, False, False)name module.module.external_feature_model.vit.conv1.bias lr_decay_rate 0.0717897987691853_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.weight key (1.0, 0.007976644307687256, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.weight key (0.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.weight key (1.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.weight lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.conv1.bias key (0.0, 0.00717897987691853, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.ls1 key (0.0, 0.008862938119652507, False, False)name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.bias lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.weight key (1.0, 0.008862938119652507, False, False)name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.bias lr_decay_rate 0.08862938119652507name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.bias lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.weight lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.0.ls1 lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.bias key (0.0, 0.013508517176729929, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.bias key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.position_embeddings.weight lr_decay_rate 0.0717897987691853 name module.module.external_feature_model.vit.decoder.layers.1.ls2 lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.bias lr_decay_rate 0.08862938119652507_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.bias key (0.0, 0.008862938119652507, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.weight key (1.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.ls1 key (0.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.position_embeddings.weight key (1.0, 0.00717897987691853, False, False)name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.weight lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.ls2 key (0.0, 0.008862938119652507, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.bias key (0.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.weight lr_decay_rate 0.07976644307687256name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.bias lr_decay_rate 0.08862938119652507name module.module.external_feature_model.vit.decoder.layers.0.ls2 lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.weight lr_decay_rate 0.08862938119652507_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.weight key (1.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.weight lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.ls2 key (0.0, 0.007976644307687256, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.weight key (0.0, 0.007976644307687256, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.weight key (1.0, 0.008862938119652507, False, False)name module.module.external_feature_model.vit.decoder.layers.2.ls1 lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.bias key (0.0, 0.008862938119652507, False, False)name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.bias lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.0.ls1 lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.weight key (0.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.bias lr_decay_rate 0.08862938119652507_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.ls1 key (0.0, 0.00984770902183612, False, False)name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.bias lr_decay_rate 0.07976644307687256_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.bias key (0.0, 0.013508517176729929, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.ls1 key (0.0, 0.007976644307687256, False, False)name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.weight lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.weight lr_decay_rate 0.07976644307687256name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.bias lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.bias key (0.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.bias key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.2.ls2 lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.weight key (0.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.weight key (1.0, 0.008862938119652507, False, False)name module.module.external_feature_model.vit.decoder.layers.0.ls2 lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.bias key (0.0, 0.008862938119652507, False, False)name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.weight lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.weight lr_decay_rate 0.08862938119652507_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.ls2 key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.weight lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.bias lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.ls2 key (0.0, 0.007976644307687256, False, False)name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.bias lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.weight key (0.0, 0.013508517176729929, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.weight key (1.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.bias key (0.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.weight key (1.0, 0.007976644307687256, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.bias key (0.0, 0.008862938119652507, False, False)name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.weight lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.weight lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.weight lr_decay_rate 0.07976644307687256name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.bias lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.bias lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.bias lr_decay_rate 0.07976644307687256_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.weight key (0.0, 0.00984770902183612, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.bias key (0.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.weight lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.weight lr_decay_rate 0.08862938119652507_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.weight key (1.0, 0.008862938119652507, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.weight key (0.0, 0.007976644307687256, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.bias key (0.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.bias key (0.0, 0.007976644307687256, False, False)name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.bias lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.weight key (1.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.weight key (0.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.bias lr_decay_rate 0.08862938119652507name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.weight lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.bias lr_decay_rate 0.07976644307687256name module.module.external_feature_model.vit.decoder.layers.2.ls1 lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.bias key (0.0, 0.00984770902183612, False, False)name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.weight lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.bias lr_decay_rate 0.07976644307687256name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.bias lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.bias key (0.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.weight key (1.0, 0.013508517176729929, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.bias key (0.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.ls1 key (0.0, 0.00984770902183612, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.weight key (1.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.bias key (0.0, 0.008862938119652507, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.bias key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.bias lr_decay_rate 0.13508517176729928name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.weight lr_decay_rate 0.08862938119652507name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.weight lr_decay_rate 0.09847709021836118name module.module.external_feature_model.vit.decoder.layers.2.ls2 lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.bias lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.weight lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.weight lr_decay_rate 0.07976644307687256name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.weight lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.bias key (0.0, 0.013508517176729929, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.weight key (1.0, 0.00984770902183612, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.bias key (0.0, 0.007976644307687256, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.ls2 key (0.0, 0.00984770902183612, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.weight key (1.0, 0.007976644307687256, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.weight key (1.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.weight key (1.0, 0.008862938119652507, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.weight key (1.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.weight lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.bias lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.bias lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.bias lr_decay_rate 0.08862938119652507name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.weight lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.bias lr_decay_rate 0.07976644307687256name module.module.external_feature_model.vit.decoder.layers.1.ls1 lr_decay_rate 0.08862938119652507name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.bias lr_decay_rate 0.08862938119652507_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.weight key (1.0, 0.013508517176729929, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.bias key (0.0, 0.00984770902183612, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.bias key (0.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.bias key (0.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.weight key (0.0, 0.00984770902183612, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.bias key (0.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.ls1 key (0.0, 0.008862938119652507, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.bias key (0.0, 0.008862938119652507, False, False)name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.bias lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.weight lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.weight lr_decay_rate 0.08862938119652507name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.bias lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.weight lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.1.ls2 lr_decay_rate 0.08862938119652507_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.bias key (0.0, 0.013508517176729929, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.weight key (1.0, 0.00984770902183612, False, False)name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.weight lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.bias key (0.0, 0.00984770902183612, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.weight key (1.0, 0.008862938119652507, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.weight key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.weight lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.ls2 key (0.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.bias lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.weight key (1.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.6.ls1 lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.bias lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.weight key (0.0, 0.008862938119652507, False, False)name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.bias lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.bias key (0.0, 0.00984770902183612, False, False)name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.weight lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.weight lr_decay_rate 0.08862938119652507name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.bias lr_decay_rate 0.07976644307687256_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.ls1 key (0.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.bias key (0.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.bias key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.bias lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.weight key (1.0, 0.00984770902183612, False, False)name module.module.external_feature_model.vit.class_token lr_decay_rate 1.0_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.weight key (0.0, 0.008862938119652507, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.bias key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.class_token lr_decay_rate 1.0 name module.module.external_feature_model.vit.decoder.layers.2.ls1 lr_decay_rate 0.09847709021836118name module.module.external_feature_model.vit.decoder.layers.6.ls2 lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.bias key (0.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.weight lr_decay_rate 0.09847709021836118name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.weight lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.bias lr_decay_rate 0.09847709021836118name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.bias lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.weight key (1.0, 0.007976644307687256, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.ls2 key (0.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.ls1 key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.weight lr_decay_rate 0.08862938119652507_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.bias key (0.0, 0.008862938119652507, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.weight key (0.0, 0.00984770902183612, False, False)name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.weight lr_decay_rate 0.07976644307687256_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.bias key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.bias lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.2.ls2 lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.weight lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.weight key (0.0, 0.007976644307687256, False, False)name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.bias lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.weight key (1.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.bias key (0.0, 0.007976644307687256, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.ls2 key (0.0, 0.00984770902183612, False, False)name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.weight lr_decay_rate 0.09847709021836118_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.weight key (0.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.weight lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.bias lr_decay_rate 0.07976644307687256_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.bias key (0.0, 0.00984770902183612, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.weight key (1.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.bias lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.bias lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.weight key (1.0, 0.008862938119652507, False, False)name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.weight lr_decay_rate 0.07976644307687256name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.weight lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.bias key (0.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.bias key (0.0, 0.015009463529699918, False, False)name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.weight lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.bias lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.bias key (0.0, 0.008862938119652507, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.weight key (1.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.weight key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.bias lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.weight lr_decay_rate 0.07976644307687256_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.weight key (1.0, 0.00984770902183612, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.bias key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.bias lr_decay_rate 0.07976644307687256name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.weight lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.bias key (0.0, 0.008862938119652507, False, False)name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.weight lr_decay_rate 0.08862938119652507name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.bias lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.weight key (1.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.bias key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.bias lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.weight key (1.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.bias key (0.0, 0.00984770902183612, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.weight key (1.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.weight lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.weight lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.bias lr_decay_rate 0.07976644307687256_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.bias key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.1.ls1 lr_decay_rate 0.08862938119652507name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.bias lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.bias lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.weight key (1.0, 0.008862938119652507, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.weight key (0.0, 0.00984770902183612, False, False)_get_param_groups name module.module.external_feature_model.vit.class_token key (1.0, 0.1, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.bias key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.weight lr_decay_rate 0.09847709021836118_get_param_groups name module.module.external_feature_model.vit.class_token key (1.0, 0.1, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.bias key (0.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.weight lr_decay_rate 0.09847709021836118_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.ls1 key (0.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.bias key (0.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.bias lr_decay_rate 0.08862938119652507name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.bias lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.weight key (1.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.weight lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.weight key (1.0, 0.00984770902183612, False, False)name module.module.external_feature_model.vit.decoder.layers.1.ls2 lr_decay_rate 0.08862938119652507_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.bias key (0.0, 0.008862938119652507, False, False)name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.weight lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.bias key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.2.ls1 lr_decay_rate 0.09847709021836118_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.weight key (1.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.conv1.weight lr_decay_rate 0.0717897987691853name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.bias lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.ls2 key (0.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.conv1.weight lr_decay_rate 0.0717897987691853 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.weight key (1.0, 0.015009463529699918, False, False)name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.bias lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.bias key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.weight lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.ls1 key (0.0, 0.00984770902183612, False, False)name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.bias lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.weight lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.conv1.weight key (1.0, 0.00717897987691853, False, False)name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.weight lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.bias key (0.0, 0.00984770902183612, False, False)_get_param_groups name module.module.external_feature_model.vit.conv1.weight key (1.0, 0.00717897987691853, False, False)name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.bias lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.bias key (0.0, 0.007976644307687256, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.weight key (0.0, 0.008862938119652507, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.weight key (1.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.2.ls2 lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.weight key (0.0, 0.008862938119652507, False, False)name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.weight lr_decay_rate 0.09847709021836118name module.module.external_feature_model.vit.conv1.bias lr_decay_rate 0.0717897987691853 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.bias key (0.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.conv1.bias lr_decay_rate 0.0717897987691853name module.module.external_feature_model.vit.decoder.layers.3.ls1 lr_decay_rate 0.10941898913151242 name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.bias lr_decay_rate 0.09847709021836118name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.bias lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.ls2 key (0.0, 0.00984770902183612, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.weight key (1.0, 0.00984770902183612, False, False) _get_param_groups name module.module.external_feature_model.vit.conv1.bias key (0.0, 0.00717897987691853, False, False) name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.bias lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.1.ls1 lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.ls1 key (0.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.bias key (0.0, 0.00984770902183612, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.bias key (0.0, 0.008862938119652507, False, False)_get_param_groups name module.module.external_feature_model.vit.conv1.bias key (0.0, 0.00717897987691853, False, False) name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.weight lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.bias key (0.0, 0.008862938119652507, False, False)name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.bias lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.weight lr_decay_rate 0.09847709021836118_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.ls1 key (0.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.position_embeddings.weight lr_decay_rate 0.0717897987691853name module.module.external_feature_model.vit.decoder.layers.3.ls2 lr_decay_rate 0.10941898913151242 name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.weight lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.weight lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.weight key (0.0, 0.015009463529699918, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.bias key (0.0, 0.00984770902183612, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.weight key (0.0, 0.00984770902183612, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.ls2 key (0.0, 0.010941898913151242, False, False)name module.module.external_feature_model.vit.position_embeddings.weight lr_decay_rate 0.0717897987691853 _get_param_groups name module.module.external_feature_model.vit.position_embeddings.weight key (1.0, 0.00717897987691853, False, False) name module.module.external_feature_model.vit.decoder.layers.1.ls2 lr_decay_rate 0.08862938119652507name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.weight lr_decay_rate 0.08862938119652507_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.weight key (1.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.weight key (1.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.bias lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.bias lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.position_embeddings.weight key (1.0, 0.00717897987691853, False, False)name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.weight lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.weight key (1.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.ls2 key (0.0, 0.008862938119652507, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.bias key (0.0, 0.015009463529699918, False, False)name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.bias lr_decay_rate 0.09847709021836118name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.bias lr_decay_rate 0.08862938119652507name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.weight lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.bias key (0.0, 0.00984770902183612, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.weight key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.0.ls1 lr_decay_rate 0.07976644307687256name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.bias lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.bias key (0.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.bias key (0.0, 0.00984770902183612, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.weight key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.weight lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.weight lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.bias key (0.0, 0.008862938119652507, False, False)name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.bias lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.ls1 key (0.0, 0.007976644307687256, False, False)name module.module.external_feature_model.vit.decoder.layers.0.ls1 lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.weight lr_decay_rate 0.09847709021836118name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.weight lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.bias lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.weight key (0.0, 0.008862938119652507, False, False)name module.module.external_feature_model.vit.decoder.layers.3.ls1 lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.bias key (0.0, 0.00984770902183612, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.weight key (1.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.weight lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.0.ls2 lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.ls1 key (0.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.weight key (1.0, 0.00984770902183612, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.weight key (1.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.bias key (0.0, 0.010941898913151242, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.ls1 key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.bias lr_decay_rate 0.15009463529699918name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.bias lr_decay_rate 0.08862938119652507_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.weight key (1.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.ls2 key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.weight lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.bias lr_decay_rate 0.09847709021836118name module.module.external_feature_model.vit.decoder.layers.0.ls2 lr_decay_rate 0.07976644307687256name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.bias lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.3.ls2 lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.bias key (0.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.bias key (0.0, 0.008862938119652507, False, False)name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.bias lr_decay_rate 0.08862938119652507name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.weight lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.bias key (0.0, 0.00984770902183612, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.weight key (1.0, 0.00984770902183612, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.bias key (0.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.ls2 key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.weight lr_decay_rate 0.07976644307687256_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.ls2 key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.weight lr_decay_rate 0.15009463529699918_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.bias key (0.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.weight key (1.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.bias lr_decay_rate 0.09847709021836118name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.weight lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.weight key (0.0, 0.007976644307687256, False, False)name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.weight lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.weight key (1.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.weight lr_decay_rate 0.10941898913151242name module.module.external_feature_model.vit.decoder.layers.2.ls1 lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.bias lr_decay_rate 0.10941898913151242name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.weight lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.weight lr_decay_rate 0.08862938119652507_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.weight key (1.0, 0.00984770902183612, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.bias key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.bias lr_decay_rate 0.07976644307687256_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.weight key (0.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.weight key (1.0, 0.008862938119652507, False, False)name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.bias lr_decay_rate 0.15009463529699918_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.ls1 key (0.0, 0.00984770902183612, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.bias key (0.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.weight key (0.0, 0.007976644307687256, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.weight key (0.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.bias lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.bias key (0.0, 0.015009463529699918, False, False)name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.weight lr_decay_rate 0.09847709021836118_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.bias key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.2.ls2 lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.bias lr_decay_rate 0.10941898913151242name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.bias lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.weight lr_decay_rate 0.10941898913151242 name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.bias lr_decay_rate 0.08862938119652507name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.bias lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.weight key (1.0, 0.00984770902183612, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.bias key (0.0, 0.00984770902183612, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.bias key (0.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.ls2 key (0.0, 0.00984770902183612, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.bias key (0.0, 0.008862938119652507, False, False)name module.module.external_feature_model.vit.decoder.layers.7.ls1 lr_decay_rate 0.16677181699666577_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.weight key (1.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.bias key (0.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.weight lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.bias key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.bias lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.weight lr_decay_rate 0.09847709021836118_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.ls1 key (0.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.weight lr_decay_rate 0.09847709021836118name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.weight lr_decay_rate 0.10941898913151242name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.bias lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.bias key (0.0, 0.00984770902183612, False, False)name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.weight lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.weight lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.weight key (1.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.weight key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.weight lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.bias key (0.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.weight key (1.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.7.ls2 lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.weight key (0.0, 0.00984770902183612, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.weight key (1.0, 0.010941898913151242, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.weight key (1.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.bias lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.bias lr_decay_rate 0.07976644307687256name module.module.external_feature_model.vit.decoder.layers.3.ls1 lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.weight key (1.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.ls2 key (0.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.bias lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.bias lr_decay_rate 0.09847709021836118name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.weight lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.bias key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.bias lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.bias lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.bias key (0.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.bias key (0.0, 0.008862938119652507, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.ls1 key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.bias lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.bias key (0.0, 0.00984770902183612, False, False)name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.weight lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.weight key (0.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.bias key (0.0, 0.008862938119652507, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.bias key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.weight lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.weight lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.weight lr_decay_rate 0.08862938119652507_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.bias key (0.0, 0.007976644307687256, False, False)name module.module.external_feature_model.vit.decoder.layers.3.ls2 lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.weight key (0.0, 0.016677181699666577, False, False)name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.weight lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.bias lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.weight key (1.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.weight key (1.0, 0.00984770902183612, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.weight key (1.0, 0.008862938119652507, False, False)name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.weight lr_decay_rate 0.08862938119652507name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.weight lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.ls2 key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.weight lr_decay_rate 0.07976644307687256_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.weight key (1.0, 0.00984770902183612, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.bias key (0.0, 0.010941898913151242, False, False)name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.bias lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.bias lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.weight key (1.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.bias lr_decay_rate 0.08862938119652507_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.weight key (0.0, 0.008862938119652507, False, False)name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.bias lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.weight key (1.0, 0.007976644307687256, False, False)name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.weight lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.bias key (0.0, 0.016677181699666577, False, False)name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.bias lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.bias key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.weight lr_decay_rate 0.10941898913151242 name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.bias lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.bias key (0.0, 0.008862938119652507, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.bias key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.bias lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.bias key (0.0, 0.00984770902183612, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.weight key (0.0, 0.010941898913151242, False, False)name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.bias lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.weight key (1.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.bias key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.weight lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.bias key (0.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.weight lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.weight lr_decay_rate 0.07976644307687256name module.module.external_feature_model.vit.decoder.layers.2.ls1 lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.weight lr_decay_rate 0.09847709021836118_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.bias key (0.0, 0.007976644307687256, False, False)name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.bias lr_decay_rate 0.10941898913151242 name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.bias lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.weight key (1.0, 0.016677181699666577, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.weight key (1.0, 0.00984770902183612, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.weight key (0.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.ls1 key (0.0, 0.00984770902183612, False, False)name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.weight lr_decay_rate 0.08862938119652507name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.weight lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.bias key (0.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.bias key (0.0, 0.010941898913151242, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.weight key (1.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.bias lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.bias lr_decay_rate 0.09847709021836118name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.weight lr_decay_rate 0.07976644307687256_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.weight key (1.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.weight key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.2.ls2 lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.bias lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.weight lr_decay_rate 0.10941898913151242name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.weight lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.bias key (0.0, 0.016677181699666577, False, False)name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.bias lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.bias lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.bias key (0.0, 0.00984770902183612, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.ls2 key (0.0, 0.00984770902183612, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.bias key (0.0, 0.007976644307687256, False, False)name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.bias lr_decay_rate 0.08862938119652507_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.weight key (0.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.weight key (1.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.weight key (1.0, 0.010941898913151242, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.bias key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.weight lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.bias key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.weight lr_decay_rate 0.09847709021836118_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.bias key (0.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.weight lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.weight lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.bias lr_decay_rate 0.07976644307687256name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.bias lr_decay_rate 0.10941898913151242 name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.bias lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.weight key (1.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.weight key (0.0, 0.00984770902183612, False, False)name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.weight lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.weight key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.3.ls1 lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.weight key (1.0, 0.007976644307687256, False, False)name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.weight lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.bias key (0.0, 0.010941898913151242, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.bias key (0.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.bias key (0.0, 0.007976644307687256, False, False)name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.bias lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.weight key (1.0, 0.010941898913151242, False, False)name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.bias lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.bias lr_decay_rate 0.09847709021836118_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.ls1 key (0.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.weight key (1.0, 0.008862938119652507, False, False)name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.bias lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.bias key (0.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.weight lr_decay_rate 0.10941898913151242 name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.bias lr_decay_rate 0.10941898913151242name module.module.external_feature_model.vit.decoder.layers.4.ls1 lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.bias key (0.0, 0.00984770902183612, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.bias key (0.0, 0.00984770902183612, False, False)name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.weight lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.bias key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.bias lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.3.ls2 lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.bias key (0.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.weight key (1.0, 0.010941898913151242, False, False)name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.weight lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.ls1 key (0.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.weight lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.weight key (1.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.ls2 key (0.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.bias key (0.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.bias lr_decay_rate 0.10941898913151242name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.weight lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.weight lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.weight key (0.0, 0.016677181699666577, False, False)name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.weight lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.weight key (1.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.4.ls2 lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.bias lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.weight lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.bias key (0.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.weight key (1.0, 0.00984770902183612, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.weight key (1.0, 0.007976644307687256, False, False)name module.module.external_feature_model.vit.decoder.layers.2.ls1 lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.weight key (1.0, 0.010941898913151242, False, False)name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.bias lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.bias lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.ls2 key (0.0, 0.012157665459056936, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.bias key (0.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.weight key (0.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.ls1 key (0.0, 0.00984770902183612, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.bias key (0.0, 0.016677181699666577, False, False)name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.bias lr_decay_rate 0.09847709021836118name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.bias lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.bias lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.bias key (0.0, 0.00984770902183612, False, False)name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.weight lr_decay_rate 0.10941898913151242 name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.weight lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.bias lr_decay_rate 0.10941898913151242 name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.weight lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.bias key (0.0, 0.00984770902183612, False, False)name module.module.external_feature_model.vit.decoder.layers.2.ls2 lr_decay_rate 0.09847709021836118_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.bias key (0.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.weight key (0.0, 0.010941898913151242, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.bias key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.weight lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.bias key (0.0, 0.010941898913151242, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.weight key (0.0, 0.012157665459056936, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.weight key (1.0, 0.007976644307687256, False, False)name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.weight lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.ls2 key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.weight lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.bias lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.weight key (1.0, 0.016677181699666577, False, False)name module.module.external_feature_model.vit.decoder.layers.1.ls1 lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.4.ls1 lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.weight key (1.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.bias lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.bias lr_decay_rate 0.07976644307687256_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.weight key (1.0, 0.00984770902183612, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.bias key (0.0, 0.010941898913151242, False, False)name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.weight lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.bias lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.ls1 key (0.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.weight lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.ls1 key (0.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.bias lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.bias key (0.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.bias key (0.0, 0.012157665459056936, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.weight key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.bias lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.bias key (0.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.weight lr_decay_rate 0.10941898913151242 name module.module.external_feature_model.vit.decoder.layers.4.ls2 lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.bias key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.1.ls2 lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.weight key (1.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.bias key (0.0, 0.00984770902183612, False, False)name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.bias lr_decay_rate 0.09847709021836118_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.weight key (1.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.1.ls1 lr_decay_rate 0.08862938119652507_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.ls2 key (0.0, 0.008862938119652507, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.ls2 key (0.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.weight lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.bias lr_decay_rate 0.10941898913151242 name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.weight lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.3.ls1 lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.bias key (0.0, 0.00984770902183612, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.weight key (1.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.weight lr_decay_rate 0.09847709021836118name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.bias lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.ls1 key (0.0, 0.008862938119652507, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.bias key (0.0, 0.010941898913151242, False, False)name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.weight lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.ls1 key (0.0, 0.010941898913151242, False, False)name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.weight lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.weight key (1.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.bias lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.bias key (0.0, 0.010941898913151242, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.weight key (0.0, 0.00984770902183612, False, False)name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.weight lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.weight key (0.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.1.ls2 lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.weight key (0.0, 0.008862938119652507, False, False)name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.weight lr_decay_rate 0.10941898913151242name module.module.external_feature_model.vit.decoder.layers.3.ls2 lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.bias key (0.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.bias lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.weight key (1.0, 0.00984770902183612, False, False)name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.bias lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.weight lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.ls2 key (0.0, 0.008862938119652507, False, False)name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.bias lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.ls2 key (0.0, 0.010941898913151242, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.weight key (1.0, 0.010941898913151242, False, False)name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.bias lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.bias key (0.0, 0.00984770902183612, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.bias key (0.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.8.ls1 lr_decay_rate 0.18530201888518416name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.bias lr_decay_rate 0.09847709021836118_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.bias key (0.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.weight key (1.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.weight lr_decay_rate 0.08862938119652507name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.bias lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.bias key (0.0, 0.008862938119652507, False, False)name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.weight lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.bias key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.weight lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.ls1 key (0.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.weight lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.bias lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.bias key (0.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.weight key (0.0, 0.008862938119652507, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.weight key (0.0, 0.010941898913151242, False, False)name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.weight lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.weight key (1.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.8.ls2 lr_decay_rate 0.18530201888518416name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.weight lr_decay_rate 0.09847709021836118name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.weight lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.weight key (1.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.bias key (0.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.weight key (1.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.bias lr_decay_rate 0.08862938119652507name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.bias lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.ls2 key (0.0, 0.018530201888518418, False, False)name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.weight lr_decay_rate 0.10941898913151242name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.bias lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.bias lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.weight key (1.0, 0.00984770902183612, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.weight key (1.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.bias key (0.0, 0.008862938119652507, False, False)name module.module.external_feature_model.vit.decoder.layers.4.ls1 lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.bias lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.bias key (0.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.bias key (0.0, 0.00984770902183612, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.weight key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.weight lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.bias lr_decay_rate 0.09847709021836118_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.bias key (0.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.bias lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.bias key (0.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.weight lr_decay_rate 0.09847709021836118_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.ls1 key (0.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.bias lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.weight key (0.0, 0.018530201888518418, False, False)name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.weight lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.bias key (0.0, 0.00984770902183612, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.bias key (0.0, 0.008862938119652507, False, False)name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.weight lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.weight key (1.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.weight lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.weight lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.decoder.layers.4.ls2 lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.bias key (0.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.weight key (1.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.bias lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.weight key (1.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.bias lr_decay_rate 0.09847709021836118_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.weight key (0.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.weight lr_decay_rate 0.09847709021836118name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.weight lr_decay_rate 0.08862938119652507_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.weight key (1.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.ls2 key (0.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.bias key (0.0, 0.018530201888518418, False, False)name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.bias lr_decay_rate 0.08862938119652507name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.weight lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.bias key (0.0, 0.00984770902183612, False, False)name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.bias lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.weight key (0.0, 0.00984770902183612, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.weight key (1.0, 0.008862938119652507, False, False)name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.bias lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.bias lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.weight key (1.0, 0.010941898913151242, False, False)name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.weight lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.bias key (0.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.bias key (0.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.bias key (0.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.weight lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.3.ls1 lr_decay_rate 0.10941898913151242name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.bias lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.bias lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.bias key (0.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.bias lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.weight key (0.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.weight lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.weight lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.bias key (0.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.weight key (1.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.bias key (0.0, 0.00984770902183612, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.ls1 key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.weight lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.bias key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.bias lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.weight key (1.0, 0.008862938119652507, False, False)name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.weight lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.weight key (1.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.bias lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.weight key (1.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.bias key (0.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.weight lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.weight lr_decay_rate 0.10941898913151242 name module.module.external_feature_model.vit.decoder.layers.3.ls2 lr_decay_rate 0.10941898913151242name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.weight lr_decay_rate 0.09847709021836118_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.weight key (0.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.bias key (0.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.bias lr_decay_rate 0.10941898913151242name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.bias lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.bias lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.weight key (0.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.ls2 key (0.0, 0.010941898913151242, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.weight key (1.0, 0.010941898913151242, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.weight key (1.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.weight lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.bias lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.weight lr_decay_rate 0.18530201888518416_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.bias key (0.0, 0.010941898913151242, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.bias key (0.0, 0.012157665459056936, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.bias key (0.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.bias lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.bias lr_decay_rate 0.10941898913151242name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.bias lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.weight lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.bias key (0.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.weight key (1.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.weight key (1.0, 0.018530201888518418, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.bias key (0.0, 0.008862938119652507, False, False)name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.weight lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.bias key (0.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.bias key (0.0, 0.00984770902183612, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.weight key (0.0, 0.010941898913151242, False, False)name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.weight lr_decay_rate 0.10941898913151242name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.weight lr_decay_rate 0.08862938119652507name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.bias lr_decay_rate 0.18530201888518416name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.bias lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.weight lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.weight key (1.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.weight lr_decay_rate 0.09847709021836118name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.weight lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.4.ls1 lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.bias lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.weight key (1.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.weight key (0.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.weight key (1.0, 0.008862938119652507, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.weight key (0.0, 0.010941898913151242, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.bias key (0.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.bias key (0.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.bias lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.weight key (1.0, 0.00984770902183612, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.ls1 key (0.0, 0.012157665459056936, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.bias key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.bias lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.bias lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.bias lr_decay_rate 0.08862938119652507name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.bias lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.bias lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.bias key (0.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.weight lr_decay_rate 0.18530201888518416name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.weight lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.bias key (0.0, 0.008862938119652507, False, False)name module.module.external_feature_model.vit.decoder.layers.4.ls2 lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.bias key (0.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.bias key (0.0, 0.00984770902183612, False, False)name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.weight lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.bias key (0.0, 0.008862938119652507, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.bias key (0.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.weight key (0.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.weight key (1.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.ls2 key (0.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.weight lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.5.ls1 lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.weight key (1.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.weight lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.weight lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.weight lr_decay_rate 0.10941898913151242 name module.module.external_feature_model.vit.decoder.layers.3.ls1 lr_decay_rate 0.10941898913151242 name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.bias lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.bias lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.weight lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.weight key (1.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.weight key (1.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.ls1 key (0.0, 0.013508517176729929, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.weight key (1.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.bias lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.weight key (1.0, 0.010941898913151242, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.ls1 key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.bias lr_decay_rate 0.08862938119652507_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.bias key (0.0, 0.018530201888518418, False, False)name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.bias lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.bias key (0.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.weight key (0.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.bias lr_decay_rate 0.10941898913151242name module.module.external_feature_model.vit.decoder.layers.5.ls2 lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.bias lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.bias key (0.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.bias key (0.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.3.ls2 lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.bias key (0.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.bias lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.weight lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.ls2 key (0.0, 0.013508517176729929, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.bias key (0.0, 0.010941898913151242, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.bias key (0.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.weight lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.weight lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.ls2 key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.weight lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.2.ls1 lr_decay_rate 0.09847709021836118_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.bias key (0.0, 0.012157665459056936, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.weight key (1.0, 0.018530201888518418, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.weight key (0.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.weight lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.weight key (1.0, 0.010941898913151242, False, False)name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.weight lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.5.ls1 lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.weight lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.weight key (1.0, 0.008862938119652507, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.ls1 key (0.0, 0.00984770902183612, False, False)name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.bias lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.bias lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.weight key (1.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.weight key (0.0, 0.010941898913151242, False, False)name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.weight lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.bias lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.weight key (0.0, 0.013508517176729929, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.ls1 key (0.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.bias lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.bias key (0.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.bias key (0.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.bias lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.weight key (1.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.bias lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.bias key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.bias lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.bias key (0.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.5.ls2 lr_decay_rate 0.13508517176729928name module.module.external_feature_model.vit.decoder.layers.2.ls2 lr_decay_rate 0.09847709021836118_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.bias key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.weight lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.weight lr_decay_rate 0.18530201888518416_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.bias key (0.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.bias key (0.0, 0.013508517176729929, False, False)name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.bias lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.ls2 key (0.0, 0.013508517176729929, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.ls2 key (0.0, 0.00984770902183612, False, False)name module.module.external_feature_model.vit.decoder.layers.2.ls1 lr_decay_rate 0.09847709021836118name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.weight lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.weight key (1.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.weight key (1.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.weight lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.bias key (0.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.4.ls1 lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.weight lr_decay_rate 0.13508517176729928name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.weight lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.ls1 key (0.0, 0.00984770902183612, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.weight key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.bias lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.bias lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.weight lr_decay_rate 0.09847709021836118_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.weight key (1.0, 0.010941898913151242, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.ls1 key (0.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.weight lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.weight key (0.0, 0.013508517176729929, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.weight key (1.0, 0.013508517176729929, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.bias key (0.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.bias lr_decay_rate 0.10941898913151242 name module.module.external_feature_model.vit.decoder.layers.2.ls2 lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.bias key (0.0, 0.018530201888518418, False, False)name module.module.external_feature_model.vit.decoder.layers.4.ls2 lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.bias lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.weight key (0.0, 0.00984770902183612, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.weight key (1.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.bias lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.bias key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.bias lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.weight lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.bias key (0.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.ls2 key (0.0, 0.00984770902183612, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.ls2 key (0.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.9.ls1 lr_decay_rate 0.20589113209464907name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.bias lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.bias key (0.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.bias lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.bias key (0.0, 0.013508517176729929, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.weight key (1.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.weight lr_decay_rate 0.10941898913151242 name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.weight lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.bias key (0.0, 0.00984770902183612, False, False)name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.weight lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.weight lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.ls1 key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.bias key (0.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.bias lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.weight lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.weight key (1.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.weight key (1.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.weight lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.weight key (0.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.weight key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.9.ls2 lr_decay_rate 0.20589113209464907_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.bias key (0.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.bias lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.weight key (1.0, 0.013508517176729929, False, False)name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.weight lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.bias lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.weight key (1.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.bias lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.weight lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.bias lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.ls2 key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.bias key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.5.ls1 lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.bias lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.bias key (0.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.weight key (1.0, 0.00984770902183612, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.bias key (0.0, 0.012157665459056936, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.bias key (0.0, 0.00984770902183612, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.weight key (0.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.bias lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.weight lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.weight lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.ls1 key (0.0, 0.013508517176729929, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.bias key (0.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.bias lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.weight lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.bias key (0.0, 0.013508517176729929, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.weight key (0.0, 0.02058911320946491, False, False) name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.bias lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.weight key (1.0, 0.010941898913151242, False, False)name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.weight lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.bias key (0.0, 0.00984770902183612, False, False)name module.module.external_feature_model.vit.decoder.layers.5.ls2 lr_decay_rate 0.13508517176729928name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.weight lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.weight key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.weight lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.bias key (0.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.bias lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.bias lr_decay_rate 0.10941898913151242name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.weight lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.weight key (1.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.weight lr_decay_rate 0.09847709021836118name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.bias lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.ls2 key (0.0, 0.013508517176729929, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.weight key (1.0, 0.00984770902183612, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.bias key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.weight key (0.0, 0.013508517176729929, False, False)name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.weight lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.bias key (0.0, 0.010941898913151242, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.weight key (1.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.bias lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.bias key (0.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.weight key (1.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.weight lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.weight lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.bias lr_decay_rate 0.09847709021836118_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.weight key (1.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.bias lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.bias key (0.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.bias lr_decay_rate 0.13508517176729928name module.module.external_feature_model.vit.decoder.layers.4.ls1 lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.bias lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.weight key (0.0, 0.013508517176729929, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.weight key (1.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.bias key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.weight lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.bias key (0.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.bias lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.ls1 key (0.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.bias lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.bias key (0.0, 0.013508517176729929, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.bias key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.weight lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.bias lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.weight key (1.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.bias key (0.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.weight lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.bias key (0.0, 0.013508517176729929, False, False)name module.module.external_feature_model.vit.decoder.layers.4.ls2 lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.weight lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.bias key (0.0, 0.02058911320946491, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.weight key (1.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.bias lr_decay_rate 0.10941898913151242name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.weight lr_decay_rate 0.09847709021836118name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.weight lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.weight key (1.0, 0.00984770902183612, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.weight key (1.0, 0.013508517176729929, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.ls2 key (0.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.weight lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.bias lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.weight lr_decay_rate 0.20589113209464907name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.weight lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.bias key (0.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.weight key (0.0, 0.00984770902183612, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.weight key (0.0, 0.013508517176729929, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.weight key (1.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.bias lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.bias key (0.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.bias lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.weight key (1.0, 0.02058911320946491, False, False) name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.weight lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.weight key (1.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.bias lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.weight lr_decay_rate 0.10941898913151242name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.bias lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.bias key (0.0, 0.00984770902183612, False, False)name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.bias lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.bias key (0.0, 0.013508517176729929, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.weight key (0.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.bias lr_decay_rate 0.20589113209464907_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.bias key (0.0, 0.00984770902183612, False, False)name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.weight lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.bias key (0.0, 0.013508517176729929, False, False)name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.bias lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.weight key (1.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.bias key (0.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.bias lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.weight lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.bias key (0.0, 0.02058911320946491, False, False)name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.weight lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.bias key (0.0, 0.013508517176729929, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.weight key (0.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.weight lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.weight lr_decay_rate 0.13508517176729928name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.bias lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.bias key (0.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.5.ls1 lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.weight key (1.0, 0.013508517176729929, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.weight key (0.0, 0.00984770902183612, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.weight key (1.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.bias lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.bias key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.weight lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.weight key (1.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.weight lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.bias lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.ls1 key (0.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.bias lr_decay_rate 0.09847709021836118name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.weight lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.bias key (0.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.bias lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.weight key (1.0, 0.013508517176729929, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.bias key (0.0, 0.013508517176729929, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.weight key (0.0, 0.02058911320946491, False, False) name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.bias lr_decay_rate 0.13508517176729928name module.module.external_feature_model.vit.decoder.layers.4.ls1 lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.bias key (0.0, 0.00984770902183612, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.bias key (0.0, 0.00984770902183612, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.weight key (1.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.5.ls2 lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.weight lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.bias lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.bias lr_decay_rate 0.20589113209464907_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.bias key (0.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.6.ls1 lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.ls1 key (0.0, 0.012157665459056936, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.ls2 key (0.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.weight lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.weight key (1.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.bias lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.bias key (0.0, 0.013508517176729929, False, False)name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.weight lr_decay_rate 0.09847709021836118_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.bias key (0.0, 0.02058911320946491, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.ls1 key (0.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.4.ls2 lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.weight lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.weight key (1.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.bias lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.bias key (0.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.weight lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.weight key (1.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.6.ls2 lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.ls2 key (0.0, 0.012157665459056936, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.weight key (1.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.bias lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.bias key (0.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.weight lr_decay_rate 0.20589113209464907name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.weight lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.weight key (0.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.weight lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.bias lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.ls2 key (0.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.bias key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.bias lr_decay_rate 0.13508517176729928name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.weight lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.weight key (1.0, 0.02058911320946491, False, False)name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.weight lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.weight key (0.0, 0.013508517176729929, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.bias key (0.0, 0.00984770902183612, False, False)name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.bias lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.weight key (1.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.bias key (0.0, 0.013508517176729929, False, False)name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.weight lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.3.ls1 lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.weight key (1.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.weight key (0.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.bias lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.bias key (0.0, 0.013508517176729929, False, False)name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.bias lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.bias lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.weight lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.weight key (0.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.ls1 key (0.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.bias key (0.0, 0.02058911320946491, False, False)name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.bias lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.decoder.layers.6.ls1 lr_decay_rate 0.15009463529699918name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.bias lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.bias key (0.0, 0.013508517176729929, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.weight key (1.0, 0.00984770902183612, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.bias key (0.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.bias lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.weight lr_decay_rate 0.13508517176729928name module.module.external_feature_model.vit.decoder.layers.3.ls2 lr_decay_rate 0.10941898913151242 name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.weight lr_decay_rate 0.20589113209464907_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.bias key (0.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.bias key (0.0, 0.012157665459056936, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.ls1 key (0.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.bias lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.weight lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.bias key (0.0, 0.015009463529699918, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.weight key (1.0, 0.013508517176729929, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.ls2 key (0.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.weight key (1.0, 0.02058911320946491, False, False) name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.weight lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.bias key (0.0, 0.00984770902183612, False, False)name module.module.external_feature_model.vit.decoder.layers.5.ls1 lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.6.ls2 lr_decay_rate 0.15009463529699918name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.weight lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.weight key (1.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.bias lr_decay_rate 0.13508517176729928name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.weight lr_decay_rate 0.10941898913151242 name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.bias lr_decay_rate 0.20589113209464907_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.weight key (0.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.weight lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.ls1 key (0.0, 0.013508517176729929, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.ls2 key (0.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.weight key (1.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.bias lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.bias key (0.0, 0.013508517176729929, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.weight key (0.0, 0.010941898913151242, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.bias key (0.0, 0.02058911320946491, False, False)name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.bias lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.weight key (1.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.3.ls1 lr_decay_rate 0.10941898913151242 name module.module.external_feature_model.vit.decoder.layers.5.ls2 lr_decay_rate 0.13508517176729928name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.bias lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.weight lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.bias key (0.0, 0.013508517176729929, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.bias key (0.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.10.ls1 lr_decay_rate 0.2287679245496101 name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.bias lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.ls1 key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.weight lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.bias lr_decay_rate 0.15009463529699918_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.weight key (0.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.ls2 key (0.0, 0.013508517176729929, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.bias key (0.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.ls1 key (0.0, 0.02287679245496101, False, False) name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.weight lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.weight lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.bias key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.3.ls2 lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.bias key (0.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.bias lr_decay_rate 0.15009463529699918_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.weight key (1.0, 0.013508517176729929, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.weight key (1.0, 0.013508517176729929, False, False)name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.weight lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.weight lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.weight key (1.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.10.ls2 lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.ls2 key (0.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.bias key (0.0, 0.015009463529699918, False, False)name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.weight lr_decay_rate 0.10941898913151242name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.weight lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.bias lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.bias lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.weight key (0.0, 0.013508517176729929, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.weight key (1.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.bias lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.ls2 key (0.0, 0.02287679245496101, False, False) name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.weight lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.weight key (1.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.weight key (1.0, 0.015009463529699918, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.bias key (0.0, 0.013508517176729929, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.bias key (0.0, 0.012157665459056936, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.bias key (0.0, 0.013508517176729929, False, False)name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.bias lr_decay_rate 0.13508517176729928name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.bias lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.weight lr_decay_rate 0.15009463529699918name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.weight lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.weight key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.bias lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.bias lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.bias key (0.0, 0.013508517176729929, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.bias key (0.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.weight lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.weight lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.weight key (0.0, 0.02287679245496101, False, False) name module.module.external_feature_model.vit.decoder.layers.6.ls1 lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.weight key (1.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.bias key (0.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.bias key (0.0, 0.010941898913151242, False, False)name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.bias lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.weight key (1.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.weight lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.ls1 key (0.0, 0.015009463529699918, False, False)name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.weight lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.weight key (0.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.bias lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.bias key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.bias lr_decay_rate 0.15009463529699918name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.bias lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.6.ls2 lr_decay_rate 0.15009463529699918_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.weight key (1.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.bias lr_decay_rate 0.13508517176729928name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.weight lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.weight key (0.0, 0.012157665459056936, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.bias key (0.0, 0.02287679245496101, False, False)name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.weight lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.bias key (0.0, 0.015009463529699918, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.ls2 key (0.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.bias key (0.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.weight lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.weight key (1.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.bias key (0.0, 0.013508517176729929, False, False)name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.bias lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.weight key (0.0, 0.015009463529699918, False, False)name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.bias lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.weight lr_decay_rate 0.15009463529699918name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.weight lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.weight lr_decay_rate 0.2287679245496101name module.module.external_feature_model.vit.decoder.layers.5.ls1 lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.weight key (1.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.bias lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.bias key (0.0, 0.013508517176729929, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.bias key (0.0, 0.012157665459056936, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.weight key (1.0, 0.015009463529699918, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.weight key (0.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.bias lr_decay_rate 0.15009463529699918name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.weight lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.weight key (1.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.ls1 key (0.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.bias lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.bias key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.bias lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.weight lr_decay_rate 0.13508517176729928name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.bias lr_decay_rate 0.15009463529699918name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.weight lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.bias key (0.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.bias lr_decay_rate 0.2287679245496101_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.weight key (1.0, 0.013508517176729929, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.bias key (0.0, 0.010941898913151242, False, False)name module.module.external_feature_model.vit.decoder.layers.5.ls2 lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.bias key (0.0, 0.015009463529699918, False, False)name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.weight lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.bias key (0.0, 0.02287679245496101, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.weight key (1.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.bias key (0.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.weight key (1.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.bias lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.ls2 key (0.0, 0.013508517176729929, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.weight key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.weight lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.bias lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.weight lr_decay_rate 0.10941898913151242 name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.weight lr_decay_rate 0.2287679245496101_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.bias key (0.0, 0.013508517176729929, False, False)name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.bias lr_decay_rate 0.13508517176729928name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.weight lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.weight key (1.0, 0.015009463529699918, False, False)name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.bias lr_decay_rate 0.10941898913151242 name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.weight lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.bias key (0.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.weight lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.bias key (0.0, 0.013508517176729929, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.weight key (1.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.weight key (1.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.bias key (0.0, 0.010941898913151242, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.weight key (1.0, 0.015009463529699918, False, False)name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.weight lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.bias lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.weight key (0.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.weight lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.bias lr_decay_rate 0.2287679245496101_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.weight key (0.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.bias lr_decay_rate 0.10941898913151242name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.weight lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.weight key (1.0, 0.013508517176729929, False, False)name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.weight lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.bias key (0.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.weight key (1.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.bias lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.bias key (0.0, 0.02287679245496101, False, False)name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.bias lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.weight key (0.0, 0.013508517176729929, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.bias key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.bias lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.weight key (1.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.bias lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.bias key (0.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.bias lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.weight lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.bias key (0.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.bias lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.bias key (0.0, 0.013508517176729929, False, False)name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.bias lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.bias key (0.0, 0.012157665459056936, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.bias key (0.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.weight lr_decay_rate 0.15009463529699918name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.weight lr_decay_rate 0.10941898913151242name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.weight lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.weight key (1.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.weight lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.bias key (0.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.5.ls1 lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.bias key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.6.ls1 lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.weight key (1.0, 0.015009463529699918, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.weight key (0.0, 0.02287679245496101, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.weight key (1.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.bias lr_decay_rate 0.15009463529699918name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.weight lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.weight key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.weight lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.ls1 key (0.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.weight lr_decay_rate 0.10941898913151242 name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.bias lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.ls1 key (0.0, 0.015009463529699918, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.weight key (1.0, 0.013508517176729929, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.bias key (0.0, 0.015009463529699918, False, False)name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.bias lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.weight key (1.0, 0.013508517176729929, False, False)name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.bias lr_decay_rate 0.15009463529699918name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.bias lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.weight key (1.0, 0.010941898913151242, False, False)name module.module.external_feature_model.vit.decoder.layers.5.ls2 lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.bias key (0.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.6.ls2 lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.bias lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.bias key (0.0, 0.010941898913151242, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.bias key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.bias key (0.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.bias lr_decay_rate 0.13508517176729928name module.module.external_feature_model.vit.decoder.layers.7.ls1 lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.ls2 key (0.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.bias lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.ls2 key (0.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.bias key (0.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.weight lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.bias key (0.0, 0.013508517176729929, False, False)name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.weight lr_decay_rate 0.15009463529699918name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.weight lr_decay_rate 0.10941898913151242name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.weight lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.bias key (0.0, 0.010941898913151242, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.ls1 key (0.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.weight lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.weight key (0.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.weight lr_decay_rate 0.15009463529699918name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.weight lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.weight key (1.0, 0.010941898913151242, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.weight key (1.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.weight key (1.0, 0.02287679245496101, False, False)name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.weight lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.weight key (0.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.7.ls2 lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.4.ls1 lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.weight key (1.0, 0.013508517176729929, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.weight key (0.0, 0.015009463529699918, False, False)name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.bias lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.bias lr_decay_rate 0.15009463529699918name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.bias lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.weight key (1.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.bias lr_decay_rate 0.10941898913151242 name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.bias lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.ls2 key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.ls1 key (0.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.bias key (0.0, 0.015009463529699918, False, False)name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.bias lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.bias key (0.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.bias key (0.0, 0.010941898913151242, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.bias key (0.0, 0.02287679245496101, False, False)name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.bias lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.bias key (0.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.bias lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.4.ls2 lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.weight lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.bias key (0.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.7.ls1 lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.bias key (0.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.weight lr_decay_rate 0.15009463529699918_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.bias key (0.0, 0.015009463529699918, False, False)name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.weight lr_decay_rate 0.10941898913151242 name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.weight lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.ls2 key (0.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.weight key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.ls1 key (0.0, 0.016677181699666577, False, False)name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.weight lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.weight key (1.0, 0.015009463529699918, False, False)name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.weight lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.weight key (1.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.6.ls1 lr_decay_rate 0.15009463529699918_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.weight key (1.0, 0.02287679245496101, False, False) name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.weight lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.bias lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.weight key (1.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.weight lr_decay_rate 0.15009463529699918name module.module.external_feature_model.vit.decoder.layers.7.ls2 lr_decay_rate 0.16677181699666577_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.weight key (0.0, 0.013508517176729929, False, False)name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.bias lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.ls1 key (0.0, 0.015009463529699918, False, False)name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.bias lr_decay_rate 0.2287679245496101_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.weight key (0.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.bias lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.bias key (0.0, 0.016677181699666577, False, False)name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.bias lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.bias key (0.0, 0.015009463529699918, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.weight key (1.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.ls2 key (0.0, 0.016677181699666577, False, False)name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.bias lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.bias key (0.0, 0.02287679245496101, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.bias key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.bias lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.6.ls2 lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.bias key (0.0, 0.013508517176729929, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.bias key (0.0, 0.013508517176729929, False, False)name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.weight lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.bias lr_decay_rate 0.15009463529699918name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.weight lr_decay_rate 0.16677181699666577_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.bias key (0.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.ls2 key (0.0, 0.015009463529699918, False, False)name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.weight lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.4.ls1 lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.decoder.layers.11.ls1 lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.weight key (1.0, 0.015009463529699918, False, False)name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.weight lr_decay_rate 0.13508517176729928name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.weight lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.bias key (0.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.weight key (1.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.weight lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.ls1 key (0.0, 0.02541865828329001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.weight key (0.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.weight lr_decay_rate 0.15009463529699918_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.weight key (1.0, 0.013508517176729929, False, False)name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.bias lr_decay_rate 0.15009463529699918_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.ls1 key (0.0, 0.012157665459056936, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.weight key (1.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.bias lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.weight lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.weight key (1.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.bias lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.11.ls2 lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.weight key (0.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.bias key (0.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.bias lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.bias key (0.0, 0.016677181699666577, False, False)name module.module.external_feature_model.vit.decoder.layers.4.ls2 lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.weight key (1.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.bias lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.ls2 key (0.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.bias key (0.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.bias lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.bias key (0.0, 0.013508517176729929, False, False)name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.bias lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.7.ls1 lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.ls2 key (0.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.bias key (0.0, 0.013508517176729929, False, False)name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.weight lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.bias lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.bias key (0.0, 0.015009463529699918, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.bias key (0.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.weight lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.ls1 key (0.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.weight lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.weight lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.bias key (0.0, 0.015009463529699918, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.weight key (1.0, 0.016677181699666577, False, False)name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.weight lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.weight lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.weight key (0.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.7.ls2 lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.weight lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.weight key (1.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.weight key (0.0, 0.013508517176729929, False, False)name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.weight lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.weight key (0.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.bias lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.weight key (1.0, 0.013508517176729929, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.ls2 key (0.0, 0.016677181699666577, False, False)name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.bias lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.weight key (1.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.weight lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.bias lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.bias lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.bias key (0.0, 0.016677181699666577, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.weight key (1.0, 0.015009463529699918, False, False)name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.bias lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.bias key (0.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.bias lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.weight lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.bias lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.weight key (0.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.bias key (0.0, 0.016677181699666577, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.bias key (0.0, 0.013508517176729929, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.bias key (0.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.bias lr_decay_rate 0.15009463529699918_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.bias key (0.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.bias key (0.0, 0.012157665459056936, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.weight key (0.0, 0.016677181699666577, False, False)name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.weight lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.weight lr_decay_rate 0.2541865828329001name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.weight lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.weight lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.bias lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.bias key (0.0, 0.015009463529699918, False, False)name module.module.external_feature_model.vit.decoder.layers.6.ls1 lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.bias lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.weight lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.weight key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.weight key (1.0, 0.02541865828329001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.weight key (1.0, 0.016677181699666577, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.bias key (0.0, 0.015009463529699918, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.ls1 key (0.0, 0.015009463529699918, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.weight key (1.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.weight lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.weight lr_decay_rate 0.15009463529699918_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.bias key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.weight key (0.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.bias lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.bias lr_decay_rate 0.2541865828329001 name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.bias lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.weight lr_decay_rate 0.15009463529699918name module.module.external_feature_model.vit.decoder.layers.6.ls2 lr_decay_rate 0.15009463529699918_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.weight key (1.0, 0.012157665459056936, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.weight key (1.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.bias lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.bias key (0.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.bias lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.weight lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.bias key (0.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.ls2 key (0.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.bias key (0.0, 0.016677181699666577, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.weight key (1.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.bias lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.bias key (0.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.bias lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.bias key (0.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.weight key (1.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.weight lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.weight lr_decay_rate 0.2541865828329001name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.weight lr_decay_rate 0.15009463529699918_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.bias key (0.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.bias lr_decay_rate 0.15009463529699918name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.weight lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.bias key (0.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.weight lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.weight key (1.0, 0.016677181699666577, False, False)name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.bias lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.weight lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.weight key (0.0, 0.015009463529699918, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.weight key (1.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.weight key (1.0, 0.013508517176729929, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.bias key (0.0, 0.015009463529699918, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.weight key (0.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.weight lr_decay_rate 0.15009463529699918name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.weight lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.bias key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.weight key (1.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.bias lr_decay_rate 0.2541865828329001 name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.bias lr_decay_rate 0.15009463529699918name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.bias lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.bias lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.weight lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.bias lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.weight key (1.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.weight key (0.0, 0.015009463529699918, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.bias key (0.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.bias lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.bias key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.bias key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.bias key (0.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.bias key (0.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.weight lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.weight key (1.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.bias lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.bias lr_decay_rate 0.15009463529699918_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.bias key (0.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.weight lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.weight lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.weight key (1.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.weight lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.bias key (0.0, 0.015009463529699918, False, False)name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.bias lr_decay_rate 0.15009463529699918name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.weight lr_decay_rate 0.16677181699666577_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.bias key (0.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.6.ls1 lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.weight lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.bias lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.weight key (0.0, 0.02541865828329001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.weight key (1.0, 0.016677181699666577, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.weight key (1.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.weight key (1.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.bias key (0.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.weight lr_decay_rate 0.15009463529699918_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.ls1 key (0.0, 0.015009463529699918, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.weight key (1.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.bias key (0.0, 0.016677181699666577, False, False)name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.bias lr_decay_rate 0.2541865828329001 name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.weight lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.bias lr_decay_rate 0.15009463529699918name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.bias lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.bias lr_decay_rate 0.16677181699666577_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.weight key (1.0, 0.015009463529699918, False, False)name module.module.external_feature_model.vit.decoder.layers.7.ls1 lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.bias key (0.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.6.ls2 lr_decay_rate 0.15009463529699918name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.bias lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.weight key (0.0, 0.012157665459056936, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.bias key (0.0, 0.016677181699666577, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.bias key (0.0, 0.015009463529699918, False, False)name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.weight lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.bias lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.bias key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.ls1 key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.bias key (0.0, 0.012157665459056936, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.ls2 key (0.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.weight lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.bias key (0.0, 0.015009463529699918, False, False)name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.bias lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.weight key (0.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.weight lr_decay_rate 0.15009463529699918name module.module.external_feature_model.vit.decoder.layers.8.ls1 lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.weight lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.weight lr_decay_rate 0.15009463529699918name module.module.external_feature_model.vit.decoder.layers.7.ls2 lr_decay_rate 0.16677181699666577_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.weight key (1.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.bias key (0.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.5.ls1 lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.weight lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.bias lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.weight key (1.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.ls1 key (0.0, 0.018530201888518418, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.weight key (0.0, 0.015009463529699918, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.weight key (1.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.ls2 key (0.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.bias lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.ls1 key (0.0, 0.013508517176729929, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.weight key (1.0, 0.015009463529699918, False, False)name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.weight lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.bias key (0.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.bias lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.8.ls2 lr_decay_rate 0.18530201888518416name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.bias lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.bias lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.weight lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.weight key (1.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.bias lr_decay_rate 0.15009463529699918_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.bias key (0.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.bias key (0.0, 0.015009463529699918, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.bias key (0.0, 0.015009463529699918, False, False)name module.module.external_feature_model.vit.decoder.layers.5.ls2 lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.bias key (0.0, 0.016677181699666577, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.ls2 key (0.0, 0.018530201888518418, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.weight key (0.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.weight lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.bias key (0.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.bias lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.weight lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.weight key (1.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.ls2 key (0.0, 0.013508517176729929, False, False)name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.bias lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.weight lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.weight lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.bias key (0.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.weight key (1.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.7.ls1 lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.8.ls1 lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.weight lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.bias lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.bias key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.weight key (1.0, 0.015009463529699918, False, False)name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.weight lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.weight key (0.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.weight key (0.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.bias lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.ls1 key (0.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.weight lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.bias key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.ls1 key (0.0, 0.018530201888518418, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.weight key (0.0, 0.013508517176729929, False, False)name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.bias lr_decay_rate 0.15009463529699918name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.bias lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.weight lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.bias lr_decay_rate 0.18530201888518416name module.module.external_feature_model.vit.decoder.layers.7.ls2 lr_decay_rate 0.16677181699666577_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.bias key (0.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.bias key (0.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.weight key (1.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.bias lr_decay_rate 0.13508517176729928name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.weight lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.decoder.layers.8.ls2 lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.bias key (0.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.bias key (0.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.weight key (1.0, 0.016677181699666577, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.ls2 key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.ls2 key (0.0, 0.018530201888518418, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.bias key (0.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.bias lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.decoder.layers.12.ls1 lr_decay_rate 0.2824295364810001name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.weight lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.weight key (1.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.bias lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.weight lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.weight lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.weight lr_decay_rate 0.18530201888518416name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.weight lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.bias key (0.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.weight key (1.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.weight key (1.0, 0.015009463529699918, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.ls1 key (0.0, 0.028242953648100012, False, False)name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.weight lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.bias key (0.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.bias lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.weight key (0.0, 0.016677181699666577, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.weight key (1.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.weight key (0.0, 0.018530201888518418, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.weight key (1.0, 0.013508517176729929, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.bias key (0.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.bias lr_decay_rate 0.15009463529699918name module.module.external_feature_model.vit.decoder.layers.12.ls2 lr_decay_rate 0.2824295364810001name module.module.external_feature_model.vit.decoder.layers.5.ls1 lr_decay_rate 0.13508517176729928name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.bias lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.weight lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.bias lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.bias lr_decay_rate 0.18530201888518416name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.bias lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.bias lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.bias key (0.0, 0.015009463529699918, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.ls2 key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.ls1 key (0.0, 0.013508517176729929, False, False)name module.module.external_feature_model.vit.decoder.layers.8.ls1 lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.bias key (0.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.bias key (0.0, 0.018530201888518418, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.bias key (0.0, 0.016677181699666577, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.bias key (0.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.weight key (1.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.bias key (0.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.weight lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.ls1 key (0.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.decoder.layers.5.ls2 lr_decay_rate 0.13508517176729928name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.weight lr_decay_rate 0.15009463529699918name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.weight lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.bias lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.weight lr_decay_rate 0.18530201888518416name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.weight lr_decay_rate 0.18530201888518416_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.weight key (0.0, 0.028242953648100012, False, False) name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.weight lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.ls2 key (0.0, 0.013508517176729929, False, False)name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.weight lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.decoder.layers.8.ls2 lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.weight key (1.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.bias key (0.0, 0.016677181699666577, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.weight key (0.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.weight key (1.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.bias lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.weight key (1.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.weight key (1.0, 0.013508517176729929, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.ls2 key (0.0, 0.018530201888518418, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.weight key (1.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.bias lr_decay_rate 0.15009463529699918name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.weight lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.bias lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.bias key (0.0, 0.028242953648100012, False, False)name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.bias lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.bias lr_decay_rate 0.18530201888518416name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.bias lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.weight lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.bias lr_decay_rate 0.16677181699666577_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.bias key (0.0, 0.015009463529699918, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.bias key (0.0, 0.015009463529699918, False, False)name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.weight lr_decay_rate 0.18530201888518416_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.bias key (0.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.weight key (0.0, 0.013508517176729929, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.bias key (0.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.bias key (0.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.weight lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.weight key (0.0, 0.016677181699666577, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.bias key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.weight key (0.0, 0.018530201888518418, False, False)name module.module.external_feature_model.vit.decoder.layers.7.ls1 lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.weight lr_decay_rate 0.15009463529699918name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.bias lr_decay_rate 0.13508517176729928name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.weight lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.weight key (1.0, 0.028242953648100012, False, False) name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.weight lr_decay_rate 0.18530201888518416name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.bias lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.weight lr_decay_rate 0.13508517176729928name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.weight lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.ls1 key (0.0, 0.016677181699666577, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.weight key (1.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.bias key (0.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.bias lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.weight key (1.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.bias lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.bias key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.weight key (0.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.bias lr_decay_rate 0.15009463529699918_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.weight key (0.0, 0.013508517176729929, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.weight key (1.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.7.ls2 lr_decay_rate 0.16677181699666577_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.bias key (0.0, 0.018530201888518418, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.bias key (0.0, 0.028242953648100012, False, False) name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.bias lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.bias key (0.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.bias lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.weight lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.bias lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.bias lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.weight lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.ls2 key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.bias key (0.0, 0.018530201888518418, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.bias key (0.0, 0.018530201888518418, False, False)name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.weight lr_decay_rate 0.2824295364810001 name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.weight lr_decay_rate 0.15009463529699918_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.weight key (1.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.weight lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.bias key (0.0, 0.013508517176729929, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.bias key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.weight key (1.0, 0.013508517176729929, False, False)name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.weight lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.weight key (1.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.weight key (1.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.weight key (1.0, 0.028242953648100012, False, False)name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.weight lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.weight lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.bias lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.weight lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.weight key (0.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.bias lr_decay_rate 0.15009463529699918name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.bias lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.weight lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.bias lr_decay_rate 0.18530201888518416_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.weight key (0.0, 0.018530201888518418, False, False)name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.bias lr_decay_rate 0.2824295364810001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.weight key (1.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.weight key (1.0, 0.013508517176729929, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.bias key (0.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.bias lr_decay_rate 0.16677181699666577_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.bias key (0.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.bias key (0.0, 0.013508517176729929, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.weight key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.bias key (0.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.bias key (0.0, 0.028242953648100012, False, False) name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.bias lr_decay_rate 0.18530201888518416name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.bias lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.bias lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.bias key (0.0, 0.016677181699666577, False, False)name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.weight lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.bias lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.7.ls1 lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.weight lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.weight lr_decay_rate 0.18530201888518416_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.bias key (0.0, 0.018530201888518418, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.bias key (0.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.bias key (0.0, 0.013508517176729929, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.weight key (1.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.bias key (0.0, 0.016677181699666577, False, False)name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.weight lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.ls1 key (0.0, 0.016677181699666577, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.weight key (1.0, 0.013508517176729929, False, False)name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.weight lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.weight key (1.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.weight lr_decay_rate 0.18530201888518416name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.weight lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.weight key (0.0, 0.028242953648100012, False, False) name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.bias lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.weight lr_decay_rate 0.18530201888518416name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.weight lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.weight key (1.0, 0.016677181699666577, False, False)name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.bias lr_decay_rate 0.13508517176729928name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.bias lr_decay_rate 0.18530201888518416name module.module.external_feature_model.vit.decoder.layers.7.ls2 lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.weight key (1.0, 0.018530201888518418, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.weight key (1.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.bias lr_decay_rate 0.2824295364810001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.bias key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.weight key (1.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.weight key (1.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.bias key (0.0, 0.018530201888518418, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.ls2 key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.bias key (0.0, 0.013508517176729929, False, False)name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.bias lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.bias lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.bias lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.bias key (0.0, 0.028242953648100012, False, False) name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.bias lr_decay_rate 0.18530201888518416name module.module.external_feature_model.vit.decoder.layers.8.ls1 lr_decay_rate 0.18530201888518416name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.bias lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.bias key (0.0, 0.016677181699666577, False, False)name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.weight lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.bias key (0.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.bias key (0.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.weight lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.weight lr_decay_rate 0.2824295364810001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.bias key (0.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.bias key (0.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.weight lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.ls1 key (0.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.weight lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.weight key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.weight key (0.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.weight lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.6.ls1 lr_decay_rate 0.15009463529699918_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.weight key (1.0, 0.028242953648100012, False, False) name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.weight lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.9.ls1 lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.weight key (0.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.bias lr_decay_rate 0.16677181699666577_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.weight key (1.0, 0.016677181699666577, False, False)name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.bias lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.8.ls2 lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.weight key (1.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.ls1 key (0.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.bias lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.weight key (1.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.ls1 key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.bias key (0.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.bias lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.bias key (0.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.bias lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.ls2 key (0.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.bias lr_decay_rate 0.18530201888518416_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.bias key (0.0, 0.028242953648100012, False, False) name module.module.external_feature_model.vit.decoder.layers.6.ls2 lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.bias lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.decoder.layers.9.ls2 lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.bias key (0.0, 0.016677181699666577, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.bias key (0.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.weight lr_decay_rate 0.18530201888518416name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.weight lr_decay_rate 0.16677181699666577_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.bias key (0.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.weight lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.ls2 key (0.0, 0.015009463529699918, False, False)name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.weight lr_decay_rate 0.2824295364810001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.bias key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.ls2 key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.weight key (1.0, 0.018530201888518418, False, False)name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.weight lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.weight key (1.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.weight lr_decay_rate 0.16677181699666577_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.weight key (0.0, 0.018530201888518418, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.weight key (1.0, 0.028242953648100012, False, False)name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.weight lr_decay_rate 0.15009463529699918name module.module.external_feature_model.vit.decoder.layers.8.ls1 lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.weight lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.bias lr_decay_rate 0.18530201888518416name module.module.external_feature_model.vit.decoder.layers.9.ls1 lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.weight key (1.0, 0.013508517176729929, False, False)name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.bias lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.weight key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.weight key (0.0, 0.015009463529699918, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.weight key (0.0, 0.02058911320946491, False, False)name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.bias lr_decay_rate 0.18530201888518416name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.bias lr_decay_rate 0.2824295364810001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.ls1 key (0.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.bias key (0.0, 0.018530201888518418, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.ls1 key (0.0, 0.02058911320946491, False, False)name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.bias lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.bias key (0.0, 0.016677181699666577, False, False)name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.bias lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.bias lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.bias key (0.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.bias key (0.0, 0.028242953648100012, False, False)name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.bias lr_decay_rate 0.20589113209464907name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.weight lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.8.ls2 lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.bias key (0.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.9.ls2 lr_decay_rate 0.20589113209464907_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.bias key (0.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.weight lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.class_token lr_decay_rate 1.0_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.bias key (0.0, 0.013508517176729929, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.bias key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.ls2 key (0.0, 0.018530201888518418, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.weight key (1.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.decoder.layers.13.ls1 lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.ls2 key (0.0, 0.02058911320946491, False, False)name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.weight lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.weight key (1.0, 0.016677181699666577, False, False)name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.weight lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.weight lr_decay_rate 0.15009463529699918name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.weight lr_decay_rate 0.13508517176729928name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.weight lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.bias lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.ls1 key (0.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.weight lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.weight key (1.0, 0.018530201888518418, False, False)name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.weight lr_decay_rate 0.20589113209464907_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.weight key (1.0, 0.016677181699666577, False, False)name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.bias lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.weight key (1.0, 0.015009463529699918, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.weight key (1.0, 0.013508517176729929, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.weight key (0.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.bias key (0.0, 0.018530201888518418, False, False)name module.module.external_feature_model.vit.decoder.layers.13.ls2 lr_decay_rate 0.31381059609000006 name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.bias lr_decay_rate 0.16677181699666577_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.weight key (1.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.bias key (0.0, 0.016677181699666577, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.weight key (0.0, 0.02058911320946491, False, False) name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.bias lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.ls2 key (0.0, 0.031381059609000006, False, False)name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.bias lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.bias lr_decay_rate 0.13508517176729928name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.bias lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.9.ls1 lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.bias key (0.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.bias lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.bias key (0.0, 0.018530201888518418, False, False)name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.bias lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.weight lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.weight lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.bias key (0.0, 0.013508517176729929, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.bias key (0.0, 0.015009463529699918, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.bias key (0.0, 0.018530201888518418, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.ls1 key (0.0, 0.02058911320946491, False, False) name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.weight lr_decay_rate 0.16677181699666577_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.bias key (0.0, 0.02058911320946491, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.bias key (0.0, 0.02058911320946491, False, False) name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.weight lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.weight key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.weight key (0.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.weight lr_decay_rate 0.15009463529699918name module.module.external_feature_model.vit.decoder.layers.6.ls1 lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.9.ls2 lr_decay_rate 0.20589113209464907_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.weight key (1.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.weight lr_decay_rate 0.18530201888518416_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.weight key (1.0, 0.018530201888518418, False, False)name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.weight lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.bias lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.bias lr_decay_rate 0.31381059609000006name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.weight lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.weight key (1.0, 0.015009463529699918, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.ls1 key (0.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.ls2 key (0.0, 0.02058911320946491, False, False) name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.bias lr_decay_rate 0.16677181699666577_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.weight key (1.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.weight key (1.0, 0.018530201888518418, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.bias key (0.0, 0.016677181699666577, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.bias key (0.0, 0.031381059609000006, False, False)name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.bias lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.weight key (1.0, 0.02058911320946491, False, False)name module.module.external_feature_model.vit.decoder.layers.6.ls2 lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.bias key (0.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.bias lr_decay_rate 0.15009463529699918name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.weight lr_decay_rate 0.20589113209464907name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.bias lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.bias lr_decay_rate 0.18530201888518416_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.bias key (0.0, 0.018530201888518418, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.ls2 key (0.0, 0.015009463529699918, False, False)name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.weight lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.bias lr_decay_rate 0.20589113209464907name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.weight lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.bias key (0.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.8.ls1 lr_decay_rate 0.18530201888518416_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.bias key (0.0, 0.02058911320946491, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.weight key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.bias key (0.0, 0.018530201888518418, False, False) _get_param_groups name module.module.external_feature_model.vit.class_token key (1.0, 0.1, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.weight key (1.0, 0.016677181699666577, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.bias key (0.0, 0.02058911320946491, False, False)name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.weight lr_decay_rate 0.18530201888518416name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.weight lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.weight key (1.0, 0.031381059609000006, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.ls1 key (0.0, 0.018530201888518418, False, False)name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.bias lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.weight lr_decay_rate 0.18530201888518416name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.weight lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.weight lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.weight key (0.0, 0.018530201888518418, False, False)name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.bias lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.bias lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.bias key (0.0, 0.02058911320946491, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.weight key (0.0, 0.015009463529699918, False, False)name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.weight lr_decay_rate 0.20589113209464907_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.weight key (1.0, 0.018530201888518418, False, False)name module.module.external_feature_model.vit.decoder.layers.8.ls2 lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.weight key (0.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.weight key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.bias key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.bias key (0.0, 0.031381059609000006, False, False)name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.bias lr_decay_rate 0.18530201888518416name module.module.external_feature_model.vit.conv1.weight lr_decay_rate 0.0717897987691853 name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.bias lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.bias lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.weight key (1.0, 0.02058911320946491, False, False)name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.weight lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.ls2 key (0.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.bias lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.bias lr_decay_rate 0.20589113209464907_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.bias key (0.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.bias key (0.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.weight lr_decay_rate 0.16677181699666577_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.bias key (0.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.weight lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.bias key (0.0, 0.015009463529699918, False, False)name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.weight lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.weight key (1.0, 0.02058911320946491, False, False)_get_param_groups name module.module.external_feature_model.vit.conv1.weight key (1.0, 0.00717897987691853, False, False)name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.bias lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.bias key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.weight key (1.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.weight key (1.0, 0.031381059609000006, False, False)name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.weight lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.weight key (0.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.weight lr_decay_rate 0.18530201888518416name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.weight lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.weight lr_decay_rate 0.15009463529699918name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.bias lr_decay_rate 0.20589113209464907_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.bias key (0.0, 0.02058911320946491, False, False)name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.weight lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.weight key (0.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.bias lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.conv1.bias lr_decay_rate 0.0717897987691853name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.bias lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.weight key (1.0, 0.015009463529699918, False, False)name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.bias lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.weight key (1.0, 0.018530201888518418, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.weight key (1.0, 0.015009463529699918, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.weight key (1.0, 0.02058911320946491, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.bias key (0.0, 0.02058911320946491, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.bias key (0.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.bias lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.bias key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.conv1.bias key (0.0, 0.00717897987691853, False, False)name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.weight lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.bias key (0.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.bias lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.bias lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.bias lr_decay_rate 0.15009463529699918name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.bias lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.bias key (0.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.weight lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.weight key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.bias key (0.0, 0.015009463529699918, False, False)name module.module.external_feature_model.vit.decoder.layers.8.ls1 lr_decay_rate 0.18530201888518416_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.bias key (0.0, 0.018530201888518418, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.bias key (0.0, 0.02058911320946491, False, False)name module.module.external_feature_model.vit.position_embeddings.weight lr_decay_rate 0.0717897987691853 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.bias key (0.0, 0.015009463529699918, False, False)name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.weight lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.weight key (1.0, 0.02058911320946491, False, False)name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.weight lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.weight lr_decay_rate 0.31381059609000006 name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.bias lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.weight lr_decay_rate 0.18530201888518416name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.weight lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.ls1 key (0.0, 0.018530201888518418, False, False)name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.weight lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.external_feature_model.vit.position_embeddings.weight key (1.0, 0.00717897987691853, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.bias key (0.0, 0.02058911320946491, False, False)name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.weight lr_decay_rate 0.15009463529699918name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.bias lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.weight key (1.0, 0.018530201888518418, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.weight key (1.0, 0.018530201888518418, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.weight key (1.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.weight key (0.0, 0.031381059609000006, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.weight key (1.0, 0.018530201888518418, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.weight key (1.0, 0.02058911320946491, False, False) name module.module.external_feature_model.vit.decoder.layers.8.ls2 lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.bias key (0.0, 0.02058911320946491, False, False) name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.weight lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.weight key (1.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.class_token lr_decay_rate 1.0name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.bias lr_decay_rate 0.18530201888518416name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.bias lr_decay_rate 0.31381059609000006 name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.bias lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.bias lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.bias lr_decay_rate 0.18530201888518416name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.bias lr_decay_rate 0.15009463529699918name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.bias lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.ls2 key (0.0, 0.018530201888518418, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.weight key (1.0, 0.02058911320946491, False, False) name module.module.external_feature_model.vit.decoder.layers.0.ls1 lr_decay_rate 0.07976644307687256name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.weight lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.bias key (0.0, 0.018530201888518418, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.bias key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.bias key (0.0, 0.018530201888518418, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.bias key (0.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.bias key (0.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.bias key (0.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.bias key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.weight key (0.0, 0.02058911320946491, False, False) name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.weight lr_decay_rate 0.18530201888518416name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.bias lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.ls1 key (0.0, 0.007976644307687256, False, False)name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.weight lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.weight lr_decay_rate 0.18530201888518416name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.weight lr_decay_rate 0.31381059609000006 name module.module.external_feature_model.vit.decoder.layers.9.ls1 lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.7.ls1 lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.bias lr_decay_rate 0.20589113209464907_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.weight key (0.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.bias key (0.0, 0.02058911320946491, False, False) name module.module.external_feature_model.vit.decoder.layers.10.ls1 lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.weight key (1.0, 0.031381059609000006, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.weight key (1.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.weight lr_decay_rate 0.15009463529699918_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.weight key (1.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.decoder.layers.0.ls2 lr_decay_rate 0.07976644307687256name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.bias lr_decay_rate 0.18530201888518416_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.ls1 key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.ls1 key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.bias key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.ls1 key (0.0, 0.02287679245496101, False, False)name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.bias lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.weight lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.weight key (0.0, 0.015009463529699918, False, False)name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.bias lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.bias key (0.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.bias lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.ls2 key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.9.ls2 lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.bias key (0.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.weight lr_decay_rate 0.20589113209464907name module.module.external_feature_model.vit.decoder.layers.7.ls2 lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.weight key (1.0, 0.02058911320946491, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.bias key (0.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.10.ls2 lr_decay_rate 0.2287679245496101_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.bias key (0.0, 0.018530201888518418, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.ls2 key (0.0, 0.02058911320946491, False, False)name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.bias lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.weight lr_decay_rate 0.18530201888518416name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.weight lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.ls2 key (0.0, 0.016677181699666577, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.weight key (1.0, 0.02058911320946491, False, False) name module.module.external_feature_model.vit.decoder.layers.9.ls1 lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.bias lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.ls2 key (0.0, 0.02287679245496101, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.bias key (0.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.weight lr_decay_rate 0.31381059609000006_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.weight key (1.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.weight key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.weight lr_decay_rate 0.20589113209464907name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.weight lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.bias lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.bias key (0.0, 0.02058911320946491, False, False)name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.weight lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.ls1 key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.weight key (1.0, 0.031381059609000006, False, False)name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.weight lr_decay_rate 0.2287679245496101name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.weight lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.bias lr_decay_rate 0.07976644307687256name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.bias lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.weight key (0.0, 0.02058911320946491, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.weight key (0.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.bias key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.weight key (0.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.9.ls2 lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.10.ls1 lr_decay_rate 0.2287679245496101_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.weight key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.weight key (1.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.bias lr_decay_rate 0.31381059609000006_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.bias key (0.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.bias key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.bias lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.bias lr_decay_rate 0.20589113209464907name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.weight lr_decay_rate 0.20589113209464907_get_param_groups name module.module.external_feature_model.vit.class_token key (1.0, 0.1, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.ls2 key (0.0, 0.02058911320946491, False, False)name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.bias lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.ls1 key (0.0, 0.02287679245496101, False, False)name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.bias lr_decay_rate 0.2287679245496101_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.bias key (0.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.bias lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.bias key (0.0, 0.016677181699666577, False, False)name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.weight lr_decay_rate 0.18530201888518416_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.weight key (1.0, 0.02058911320946491, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.bias key (0.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.bias key (0.0, 0.02058911320946491, False, False) name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.weight lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.weight lr_decay_rate 0.20589113209464907name module.module.external_feature_model.vit.decoder.layers.10.ls2 lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.bias key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.bias key (0.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.14.ls1 lr_decay_rate 0.3486784401000001name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.bias lr_decay_rate 0.20589113209464907_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.weight key (1.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.weight lr_decay_rate 0.18530201888518416name module.module.external_feature_model.vit.conv1.weight lr_decay_rate 0.0717897987691853 name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.weight lr_decay_rate 0.16677181699666577_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.weight key (0.0, 0.02058911320946491, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.weight key (1.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.ls2 key (0.0, 0.02287679245496101, False, False) name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.weight lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.bias key (0.0, 0.02058911320946491, False, False) name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.weight lr_decay_rate 0.2287679245496101_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.weight key (1.0, 0.018530201888518418, False, False)name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.bias lr_decay_rate 0.18530201888518416_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.ls1 key (0.0, 0.03486784401000001, False, False) name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.weight lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.bias lr_decay_rate 0.20589113209464907_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.weight key (1.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.weight key (1.0, 0.02058911320946491, False, False) name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.bias lr_decay_rate 0.07976644307687256_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.bias key (0.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.conv1.weight key (1.0, 0.00717897987691853, False, False)name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.weight lr_decay_rate 0.2287679245496101 name module.module.external_feature_model.vit.decoder.layers.10.ls1 lr_decay_rate 0.2287679245496101name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.bias lr_decay_rate 0.18530201888518416_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.weight key (1.0, 0.02287679245496101, False, False)name module.module.external_feature_model.vit.decoder.layers.14.ls2 lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.bias key (0.0, 0.02058911320946491, False, False)name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.bias lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.weight key (1.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.bias lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.ls2 key (0.0, 0.03486784401000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.bias key (0.0, 0.007976644307687256, False, False)name module.module.external_feature_model.vit.conv1.bias lr_decay_rate 0.0717897987691853_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.weight key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.bias key (0.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.ls1 key (0.0, 0.02287679245496101, False, False) name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.weight lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.bias lr_decay_rate 0.2287679245496101_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.bias key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.bias key (0.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.bias lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.weight lr_decay_rate 0.20589113209464907_get_param_groups name module.module.external_feature_model.vit.conv1.bias key (0.0, 0.00717897987691853, False, False) name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.weight lr_decay_rate 0.3486784401000001name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.bias lr_decay_rate 0.2287679245496101_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.weight key (0.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.weight lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.weight lr_decay_rate 0.18530201888518416name module.module.external_feature_model.vit.decoder.layers.10.ls2 lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.bias key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.bias key (0.0, 0.015009463529699918, False, False)name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.weight lr_decay_rate 0.20589113209464907name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.weight lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.weight key (1.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.weight key (0.0, 0.03486784401000001, False, False)name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.bias lr_decay_rate 0.18530201888518416_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.bias key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.weight key (1.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.ls2 key (0.0, 0.02287679245496101, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.weight key (1.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.position_embeddings.weight lr_decay_rate 0.0717897987691853_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.weight key (1.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.weight key (1.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.weight lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.bias key (0.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.decoder.layers.7.ls1 lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.bias lr_decay_rate 0.3486784401000001name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.bias lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.bias lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.bias lr_decay_rate 0.07976644307687256_get_param_groups name module.module.external_feature_model.vit.position_embeddings.weight key (1.0, 0.00717897987691853, False, False) name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.weight lr_decay_rate 0.2287679245496101name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.bias lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.weight lr_decay_rate 0.2287679245496101_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.weight key (1.0, 0.02287679245496101, False, False) name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.bias lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.bias key (0.0, 0.03486784401000001, False, False)name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.weight lr_decay_rate 0.18530201888518416_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.ls1 key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.bias key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.bias key (0.0, 0.007976644307687256, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.bias key (0.0, 0.018530201888518418, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.weight key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.bias key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.weight key (1.0, 0.02287679245496101, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.bias key (0.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.bias lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.weight key (1.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.decoder.layers.7.ls2 lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.decoder.layers.0.ls1 lr_decay_rate 0.07976644307687256name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.weight lr_decay_rate 0.3486784401000001name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.bias lr_decay_rate 0.2287679245496101 name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.weight lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.9.ls1 lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.bias lr_decay_rate 0.2287679245496101name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.weight lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.ls2 key (0.0, 0.016677181699666577, False, False)name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.weight lr_decay_rate 0.20589113209464907_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.bias key (0.0, 0.02287679245496101, False, False) name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.bias lr_decay_rate 0.18530201888518416name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.weight lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.bias key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.ls1 key (0.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.weight key (1.0, 0.03486784401000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.weight key (1.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.ls1 key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.bias key (0.0, 0.02287679245496101, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.weight key (0.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.weight key (0.0, 0.02058911320946491, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.bias key (0.0, 0.018530201888518418, False, False)name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.weight lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.weight key (0.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.bias lr_decay_rate 0.20589113209464907name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.bias lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.weight lr_decay_rate 0.2287679245496101name module.module.external_feature_model.vit.decoder.layers.0.ls2 lr_decay_rate 0.07976644307687256name module.module.external_feature_model.vit.decoder.layers.9.ls2 lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.bias lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.weight lr_decay_rate 0.2287679245496101name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.weight lr_decay_rate 0.2287679245496101 name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.bias lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.weight key (0.0, 0.016677181699666577, False, False)name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.weight lr_decay_rate 0.18530201888518416_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.bias key (0.0, 0.02058911320946491, False, False)name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.bias lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.bias key (0.0, 0.03486784401000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.bias key (0.0, 0.007976644307687256, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.ls2 key (0.0, 0.02058911320946491, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.weight key (0.0, 0.02287679245496101, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.ls2 key (0.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.weight key (1.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.bias key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.bias key (0.0, 0.02058911320946491, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.weight key (1.0, 0.02287679245496101, False, False) name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.bias lr_decay_rate 0.16677181699666577_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.weight key (1.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.bias lr_decay_rate 0.2287679245496101 name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.weight lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.bias lr_decay_rate 0.2287679245496101name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.weight lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.weight lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.weight lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.weight lr_decay_rate 0.07976644307687256name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.weight lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.bias lr_decay_rate 0.18530201888518416_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.bias key (0.0, 0.016677181699666577, False, False)name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.weight lr_decay_rate 0.20589113209464907name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.bias lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.bias key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.weight key (1.0, 0.03486784401000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.bias key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.weight key (1.0, 0.007976644307687256, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.weight key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.weight key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.weight key (0.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.weight key (1.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.bias key (0.0, 0.018530201888518418, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.bias key (0.0, 0.02287679245496101, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.weight key (1.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.bias lr_decay_rate 0.20589113209464907name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.bias lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.bias lr_decay_rate 0.07976644307687256name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.bias lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.weight lr_decay_rate 0.2287679245496101 name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.weight lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.weight lr_decay_rate 0.2287679245496101name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.bias lr_decay_rate 0.07976644307687256name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.bias lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.9.ls1 lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.bias key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.bias key (0.0, 0.03486784401000001, False, False)name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.weight lr_decay_rate 0.2287679245496101 name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.bias lr_decay_rate 0.16677181699666577_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.bias key (0.0, 0.007976644307687256, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.bias key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.bias key (0.0, 0.007976644307687256, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.weight key (1.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.weight key (1.0, 0.016677181699666577, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.weight key (0.0, 0.02287679245496101, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.bias key (0.0, 0.02058911320946491, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.ls1 key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.weight key (1.0, 0.02287679245496101, False, False) name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.weight lr_decay_rate 0.07976644307687256_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.bias key (0.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.bias lr_decay_rate 0.2287679245496101name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.weight lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.weight lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.weight lr_decay_rate 0.20589113209464907name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.bias lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.weight lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.bias lr_decay_rate 0.2287679245496101 name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.weight lr_decay_rate 0.20589113209464907_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.bias key (0.0, 0.02287679245496101, False, False)name module.module.external_feature_model.vit.decoder.layers.9.ls2 lr_decay_rate 0.20589113209464907_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.weight key (1.0, 0.007976644307687256, False, False)name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.bias lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.weight key (1.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.weight key (1.0, 0.02058911320946491, False, False)name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.weight lr_decay_rate 0.16677181699666577_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.weight key (0.0, 0.03486784401000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.weight key (1.0, 0.007976644307687256, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.bias key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.bias key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.weight key (1.0, 0.02058911320946491, False, False) name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.weight lr_decay_rate 0.2287679245496101_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.bias key (0.0, 0.02287679245496101, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.ls2 key (0.0, 0.02058911320946491, False, False)name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.bias lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.bias lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.weight key (1.0, 0.016677181699666577, False, False)name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.bias lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.bias lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.bias lr_decay_rate 0.20589113209464907name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.bias lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.weight lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.weight lr_decay_rate 0.2287679245496101_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.weight key (1.0, 0.02287679245496101, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.bias key (0.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.bias key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.bias key (0.0, 0.02058911320946491, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.bias key (0.0, 0.007976644307687256, False, False)name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.weight lr_decay_rate 0.20589113209464907_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.bias key (0.0, 0.03486784401000001, False, False)name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.bias lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.weight lr_decay_rate 0.2287679245496101_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.bias key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.weight key (1.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.weight lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.weight key (1.0, 0.02287679245496101, False, False)name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.bias lr_decay_rate 0.2287679245496101name module.module.external_feature_model.vit.decoder.layers.1.ls1 lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.weight key (0.0, 0.02058911320946491, False, False)name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.weight lr_decay_rate 0.20589113209464907name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.weight lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.bias key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.weight key (0.0, 0.02287679245496101, False, False)name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.bias lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.weight lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.weight key (1.0, 0.02058911320946491, False, False)name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.bias lr_decay_rate 0.2287679245496101_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.bias key (0.0, 0.02287679245496101, False, False) name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.bias lr_decay_rate 0.20589113209464907name module.module.external_feature_model.vit.decoder.layers.10.ls1 lr_decay_rate 0.2287679245496101_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.ls1 key (0.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.weight key (1.0, 0.02058911320946491, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.weight key (1.0, 0.03486784401000001, False, False) name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.bias lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.bias key (0.0, 0.016677181699666577, False, False)name module.module.external_feature_model.vit.decoder.layers.8.ls1 lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.bias key (0.0, 0.02287679245496101, False, False)name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.bias lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.weight key (1.0, 0.007976644307687256, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.ls1 key (0.0, 0.02287679245496101, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.bias key (0.0, 0.02058911320946491, False, False) name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.bias lr_decay_rate 0.3486784401000001name module.module.external_feature_model.vit.decoder.layers.11.ls1 lr_decay_rate 0.2541865828329001 name module.module.external_feature_model.vit.decoder.layers.1.ls2 lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.bias lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.ls1 key (0.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.bias key (0.0, 0.02287679245496101, False, False)name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.weight lr_decay_rate 0.2287679245496101_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.bias key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.bias key (0.0, 0.03486784401000001, False, False) name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.weight lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.bias lr_decay_rate 0.07976644307687256name module.module.external_feature_model.vit.decoder.layers.10.ls2 lr_decay_rate 0.2287679245496101_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.ls2 key (0.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.weight key (1.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.ls1 key (0.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.weight lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.bias key (0.0, 0.02058911320946491, False, False)name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.weight lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.weight lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.8.ls2 lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.10.ls1 lr_decay_rate 0.2287679245496101_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.ls2 key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.bias key (0.0, 0.007976644307687256, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.weight key (0.0, 0.016677181699666577, False, False)name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.bias lr_decay_rate 0.2287679245496101 name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.weight lr_decay_rate 0.08862938119652507_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.weight key (1.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.weight key (1.0, 0.02287679245496101, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.weight key (1.0, 0.03486784401000001, False, False) name module.module.external_feature_model.vit.decoder.layers.11.ls2 lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.ls1 key (0.0, 0.02287679245496101, False, False) name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.weight lr_decay_rate 0.20589113209464907_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.ls2 key (0.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.weight lr_decay_rate 0.2287679245496101_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.bias key (0.0, 0.02287679245496101, False, False) name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.bias lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.weight key (0.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.bias lr_decay_rate 0.20589113209464907name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.weight lr_decay_rate 0.07976644307687256name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.bias lr_decay_rate 0.3486784401000001name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.bias lr_decay_rate 0.2287679245496101_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.ls2 key (0.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.10.ls2 lr_decay_rate 0.2287679245496101_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.bias key (0.0, 0.016677181699666577, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.weight key (0.0, 0.02058911320946491, False, False)name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.weight lr_decay_rate 0.18530201888518416name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.bias lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.weight key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.weight key (0.0, 0.007976644307687256, False, False)name module.module.external_feature_model.vit.decoder.layers.11.ls1 lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.bias key (0.0, 0.02287679245496101, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.bias key (0.0, 0.02058911320946491, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.bias key (0.0, 0.03486784401000001, False, False) name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.weight lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.ls2 key (0.0, 0.02287679245496101, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.weight key (0.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.bias lr_decay_rate 0.20589113209464907_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.bias key (0.0, 0.008862938119652507, False, False)name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.bias lr_decay_rate 0.2287679245496101 name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.weight lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.ls1 key (0.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.bias lr_decay_rate 0.07976644307687256name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.weight lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.weight lr_decay_rate 0.2287679245496101name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.bias lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.15.ls1 lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.weight key (0.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.weight lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.bias key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.bias key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.weight key (1.0, 0.016677181699666577, False, False)name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.weight lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.weight key (1.0, 0.02287679245496101, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.ls1 key (0.0, 0.03874204890000001, False, False)name module.module.external_feature_model.vit.decoder.layers.11.ls2 lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.bias key (0.0, 0.007976644307687256, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.weight key (1.0, 0.02058911320946491, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.bias key (0.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.bias lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.weight key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.weight key (1.0, 0.008862938119652507, False, False)name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.bias lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.weight lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.weight lr_decay_rate 0.2287679245496101 name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.bias lr_decay_rate 0.2287679245496101 name module.module.external_feature_model.vit.decoder.layers.15.ls2 lr_decay_rate 0.3874204890000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.ls2 key (0.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.bias lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.bias key (0.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.weight lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.bias lr_decay_rate 0.2287679245496101_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.bias key (0.0, 0.016677181699666577, False, False)name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.weight lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.bias lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.weight key (1.0, 0.02058911320946491, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.bias key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.weight key (1.0, 0.02287679245496101, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.ls2 key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.bias key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.weight key (1.0, 0.007976644307687256, False, False)name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.weight lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.bias key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.bias key (0.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.weight key (1.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.weight lr_decay_rate 0.2541865828329001name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.weight lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.bias lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.weight key (0.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.11.ls1 lr_decay_rate 0.2541865828329001 name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.bias lr_decay_rate 0.2287679245496101name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.weight lr_decay_rate 0.3874204890000001name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.bias lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.weight key (1.0, 0.016677181699666577, False, False)name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.weight lr_decay_rate 0.2287679245496101_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.bias key (0.0, 0.02058911320946491, False, False) name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.weight lr_decay_rate 0.20589113209464907name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.bias lr_decay_rate 0.18530201888518416name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.weight lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.weight key (1.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.bias lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.ls1 key (0.0, 0.02541865828329001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.weight key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.bias key (0.0, 0.02287679245496101, False, False) name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.weight lr_decay_rate 0.20589113209464907_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.weight key (1.0, 0.008862938119652507, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.bias key (0.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.weight key (1.0, 0.02287679245496101, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.weight key (0.0, 0.02058911320946491, False, False) name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.bias lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.bias lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.bias key (0.0, 0.018530201888518418, False, False)name module.module.external_feature_model.vit.decoder.layers.11.ls2 lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.bias key (0.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.bias lr_decay_rate 0.3874204890000001name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.bias lr_decay_rate 0.08862938119652507_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.weight key (1.0, 0.02058911320946491, False, False) name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.weight lr_decay_rate 0.2287679245496101 name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.weight lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.bias key (0.0, 0.02541865828329001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.ls2 key (0.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.bias lr_decay_rate 0.2287679245496101 name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.bias lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.bias key (0.0, 0.016677181699666577, False, False)name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.weight lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.bias key (0.0, 0.03874204890000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.bias key (0.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.bias lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.weight lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.weight key (1.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.weight key (1.0, 0.007976644307687256, False, False)name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.weight lr_decay_rate 0.2541865828329001 name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.weight lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.weight key (1.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.bias key (0.0, 0.02058911320946491, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.bias key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.bias key (0.0, 0.02058911320946491, False, False)name module.module.external_feature_model.vit.decoder.layers.8.ls1 lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.weight key (1.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.weight lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.weight lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.weight key (1.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.bias lr_decay_rate 0.2287679245496101 name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.bias lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.bias lr_decay_rate 0.18530201888518416_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.weight key (0.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.weight lr_decay_rate 0.2287679245496101 name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.weight lr_decay_rate 0.20589113209464907name module.module.external_feature_model.vit.decoder.layers.10.ls1 lr_decay_rate 0.2287679245496101 name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.bias lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.ls1 key (0.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.weight key (0.0, 0.008862938119652507, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.weight key (1.0, 0.03874204890000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.bias key (0.0, 0.007976644307687256, False, False)name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.bias lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.bias key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.bias key (0.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.bias lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.weight key (1.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.weight key (1.0, 0.02287679245496101, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.bias key (0.0, 0.02541865828329001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.ls1 key (0.0, 0.02287679245496101, False, False) name module.module.external_feature_model.vit.decoder.layers.8.ls2 lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.bias key (0.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.bias lr_decay_rate 0.08862938119652507name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.bias lr_decay_rate 0.3874204890000001 name module.module.external_feature_model.vit.decoder.layers.1.ls1 lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.bias key (0.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.bias lr_decay_rate 0.2287679245496101 name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.bias lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.weight lr_decay_rate 0.2287679245496101name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.weight lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.weight lr_decay_rate 0.2541865828329001name module.module.external_feature_model.vit.decoder.layers.10.ls2 lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.bias key (0.0, 0.008862938119652507, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.ls2 key (0.0, 0.018530201888518418, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.ls1 key (0.0, 0.008862938119652507, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.bias key (0.0, 0.03874204890000001, False, False) name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.weight lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.bias key (0.0, 0.02287679245496101, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.weight key (0.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.bias key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.ls2 key (0.0, 0.02287679245496101, False, False) name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.weight lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.weight key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.weight key (1.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.weight lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.weight lr_decay_rate 0.3874204890000001 name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.bias lr_decay_rate 0.18530201888518416name module.module.external_feature_model.vit.decoder.layers.1.ls2 lr_decay_rate 0.08862938119652507_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.weight key (0.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.weight lr_decay_rate 0.20589113209464907name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.weight lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.bias lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.weight key (1.0, 0.03874204890000001, False, False)name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.bias lr_decay_rate 0.2541865828329001 name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.weight lr_decay_rate 0.2287679245496101_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.weight key (1.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.weight lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.weight key (0.0, 0.018530201888518418, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.bias key (0.0, 0.02287679245496101, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.bias key (0.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.bias lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.ls2 key (0.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.weight key (1.0, 0.008862938119652507, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.weight key (1.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.bias key (0.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.bias lr_decay_rate 0.3874204890000001name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.bias lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.weight key (0.0, 0.02287679245496101, False, False) name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.bias lr_decay_rate 0.18530201888518416_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.weight key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.bias key (0.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.weight lr_decay_rate 0.2287679245496101name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.weight lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.bias lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.weight lr_decay_rate 0.08862938119652507name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.bias lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.bias key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.bias key (0.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.bias key (0.0, 0.018530201888518418, False, False)name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.bias lr_decay_rate 0.2287679245496101name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.bias lr_decay_rate 0.2287679245496101 name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.weight lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.weight key (1.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.bias key (0.0, 0.02058911320946491, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.weight key (1.0, 0.018530201888518418, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.weight key (0.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.bias key (0.0, 0.008862938119652507, False, False)name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.weight lr_decay_rate 0.2541865828329001 name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.weight lr_decay_rate 0.2541865828329001 name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.weight lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.bias key (0.0, 0.02287679245496101, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.bias key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.weight key (0.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.weight lr_decay_rate 0.18530201888518416name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.bias lr_decay_rate 0.2287679245496101name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.bias lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.weight key (1.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.bias lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.weight key (1.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.10.ls1 lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.weight key (0.0, 0.03874204890000001, False, False) name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.weight lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.weight lr_decay_rate 0.2287679245496101 name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.bias lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.weight key (1.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.bias key (0.0, 0.02287679245496101, False, False)name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.weight lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.bias key (0.0, 0.018530201888518418, False, False)name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.bias lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.bias key (0.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.bias lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.ls1 key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.weight key (1.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.bias lr_decay_rate 0.3874204890000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.weight key (1.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.bias key (0.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.weight lr_decay_rate 0.18530201888518416name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.bias lr_decay_rate 0.18530201888518416_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.weight key (1.0, 0.02287679245496101, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.bias key (0.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.weight lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.bias key (0.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.bias lr_decay_rate 0.08862938119652507_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.bias key (0.0, 0.03874204890000001, False, False) name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.weight lr_decay_rate 0.08862938119652507name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.weight lr_decay_rate 0.2541865828329001name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.bias lr_decay_rate 0.2287679245496101 name module.module.external_feature_model.vit.decoder.layers.10.ls2 lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.weight key (1.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.bias lr_decay_rate 0.2287679245496101_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.bias key (0.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.bias key (0.0, 0.008862938119652507, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.weight key (1.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.weight key (1.0, 0.02541865828329001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.bias key (0.0, 0.02287679245496101, False, False) name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.weight lr_decay_rate 0.2541865828329001name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.weight lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.weight key (1.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.ls2 key (0.0, 0.02287679245496101, False, False)name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.weight lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.bias key (0.0, 0.02287679245496101, False, False)name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.bias lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.weight lr_decay_rate 0.18530201888518416_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.weight key (1.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.bias lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.weight key (0.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.bias lr_decay_rate 0.2287679245496101name module.module.external_feature_model.vit.decoder.layers.2.ls1 lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.bias key (0.0, 0.018530201888518418, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.weight key (1.0, 0.03874204890000001, False, False)name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.weight lr_decay_rate 0.2287679245496101name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.bias lr_decay_rate 0.08862938119652507name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.weight lr_decay_rate 0.2287679245496101 name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.weight lr_decay_rate 0.2287679245496101 name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.bias lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.weight key (1.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.bias key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.bias key (0.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.ls1 key (0.0, 0.00984770902183612, False, False)name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.bias lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.weight key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.weight key (1.0, 0.02287679245496101, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.bias key (0.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.9.ls1 lr_decay_rate 0.20589113209464907name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.bias lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.weight key (1.0, 0.02287679245496101, False, False) name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.bias lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.bias key (0.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.bias key (0.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.weight lr_decay_rate 0.2541865828329001name module.module.external_feature_model.vit.decoder.layers.2.ls2 lr_decay_rate 0.09847709021836118name module.module.external_feature_model.vit.decoder.layers.11.ls1 lr_decay_rate 0.2541865828329001 name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.bias lr_decay_rate 0.2287679245496101name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.bias lr_decay_rate 0.2287679245496101name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.bias lr_decay_rate 0.2287679245496101name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.weight lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.bias key (0.0, 0.03874204890000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.ls1 key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.bias key (0.0, 0.018530201888518418, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.ls2 key (0.0, 0.00984770902183612, False, False)name module.module.external_feature_model.vit.decoder.layers.12.ls1 lr_decay_rate 0.2824295364810001 name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.weight lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.weight key (1.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.bias key (0.0, 0.02287679245496101, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.ls1 key (0.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.bias key (0.0, 0.02287679245496101, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.weight key (1.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.bias key (0.0, 0.02287679245496101, False, False) name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.weight lr_decay_rate 0.3874204890000001 name module.module.external_feature_model.vit.decoder.layers.9.ls2 lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.bias lr_decay_rate 0.2541865828329001name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.weight lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.ls1 key (0.0, 0.028242953648100012, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.weight key (1.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.weight lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.11.ls2 lr_decay_rate 0.2541865828329001name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.bias lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.weight key (1.0, 0.03874204890000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.bias key (0.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.11.ls1 lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.ls2 key (0.0, 0.02058911320946491, False, False)name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.weight lr_decay_rate 0.2287679245496101_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.weight key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.12.ls2 lr_decay_rate 0.2824295364810001 name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.bias lr_decay_rate 0.2541865828329001name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.weight lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.bias key (0.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.weight key (0.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.ls2 key (0.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.ls2 key (0.0, 0.028242953648100012, False, False)name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.bias lr_decay_rate 0.3874204890000001 name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.bias lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.ls1 key (0.0, 0.02541865828329001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.bias key (0.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.weight key (1.0, 0.02287679245496101, False, False)name module.module.external_feature_model.vit.decoder.layers.12.ls1 lr_decay_rate 0.2824295364810001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.weight key (0.0, 0.02287679245496101, False, False) name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.weight lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.bias lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.weight lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.bias key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.weight lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.bias key (0.0, 0.03874204890000001, False, False)name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.weight lr_decay_rate 0.2824295364810001 name module.module.external_feature_model.vit.decoder.layers.11.ls2 lr_decay_rate 0.2541865828329001 name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.bias lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.ls1 key (0.0, 0.028242953648100012, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.bias key (0.0, 0.018530201888518418, False, False)name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.weight lr_decay_rate 0.2541865828329001 name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.bias lr_decay_rate 0.2287679245496101_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.weight key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.weight key (0.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.weight key (0.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.weight key (0.0, 0.028242953648100012, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.ls2 key (0.0, 0.02541865828329001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.bias key (0.0, 0.02287679245496101, False, False)name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.weight lr_decay_rate 0.09847709021836118name module.module.external_feature_model.vit.decoder.layers.16.ls1 lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.weight key (1.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.12.ls2 lr_decay_rate 0.2824295364810001name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.bias lr_decay_rate 0.20589113209464907_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.bias key (0.0, 0.02287679245496101, False, False)name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.weight lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.bias lr_decay_rate 0.08862938119652507name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.bias lr_decay_rate 0.2824295364810001 name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.bias lr_decay_rate 0.2541865828329001 name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.weight lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.weight key (1.0, 0.00984770902183612, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.ls1 key (0.0, 0.04304672100000001, False, False) name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.weight lr_decay_rate 0.2287679245496101_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.ls2 key (0.0, 0.028242953648100012, False, False) name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.bias lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.bias key (0.0, 0.008862938119652507, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.bias key (0.0, 0.02058911320946491, False, False) name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.weight lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.weight key (1.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.bias key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.bias key (0.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.weight key (0.0, 0.02541865828329001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.weight key (1.0, 0.02287679245496101, False, False)name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.bias lr_decay_rate 0.09847709021836118name module.module.external_feature_model.vit.decoder.layers.16.ls2 lr_decay_rate 0.4304672100000001 name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.weight lr_decay_rate 0.2824295364810001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.bias key (0.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.weight key (1.0, 0.02287679245496101, False, False)name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.weight lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.bias lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.weight lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.bias lr_decay_rate 0.2287679245496101_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.bias key (0.0, 0.00984770902183612, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.ls2 key (0.0, 0.04304672100000001, False, False)name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.bias lr_decay_rate 0.2541865828329001name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.weight lr_decay_rate 0.2541865828329001name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.weight lr_decay_rate 0.2824295364810001 name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.bias lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.bias key (0.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.weight key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.weight key (1.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.12.ls1 lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.weight key (1.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.bias key (0.0, 0.02541865828329001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.bias key (0.0, 0.02287679245496101, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.weight key (1.0, 0.028242953648100012, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.bias key (0.0, 0.02287679245496101, False, False) name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.weight lr_decay_rate 0.09847709021836118name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.weight lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.weight lr_decay_rate 0.4304672100000001name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.bias lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.weight key (1.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.bias lr_decay_rate 0.20589113209464907_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.ls1 key (0.0, 0.028242953648100012, False, False)name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.bias lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.weight lr_decay_rate 0.2287679245496101 name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.bias lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.weight key (1.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.weight lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.weight key (1.0, 0.018530201888518418, False, False)name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.weight lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.weight key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.bias key (0.0, 0.028242953648100012, False, False) name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.bias lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.bias key (0.0, 0.008862938119652507, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.weight key (1.0, 0.02287679245496101, False, False)name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.bias lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.bias key (0.0, 0.02058911320946491, False, False) name module.module.external_feature_model.vit.decoder.layers.12.ls2 lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.bias key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.weight key (1.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.weight key (0.0, 0.02287679245496101, False, False) name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.bias lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.bias key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.weight lr_decay_rate 0.08862938119652507name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.bias lr_decay_rate 0.4304672100000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.bias key (0.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.weight lr_decay_rate 0.20589113209464907_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.ls2 key (0.0, 0.028242953648100012, False, False)name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.weight lr_decay_rate 0.2824295364810001name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.bias lr_decay_rate 0.2287679245496101 name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.weight lr_decay_rate 0.2824295364810001name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.bias lr_decay_rate 0.2287679245496101 name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.bias lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.bias key (0.0, 0.018530201888518418, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.weight key (1.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.weight lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.bias key (0.0, 0.04304672100000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.weight key (1.0, 0.02058911320946491, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.bias key (0.0, 0.02287679245496101, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.bias key (0.0, 0.02287679245496101, False, False) name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.weight lr_decay_rate 0.2541865828329001name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.weight lr_decay_rate 0.2824295364810001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.weight key (1.0, 0.028242953648100012, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.weight key (1.0, 0.028242953648100012, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.bias key (0.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.bias lr_decay_rate 0.08862938119652507_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.weight key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.9.ls1 lr_decay_rate 0.20589113209464907name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.bias lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.weight lr_decay_rate 0.2287679245496101name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.weight lr_decay_rate 0.4304672100000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.weight key (0.0, 0.028242953648100012, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.weight key (1.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.bias lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.bias key (0.0, 0.008862938119652507, False, False)name module.module.external_feature_model.vit.decoder.layers.11.ls1 lr_decay_rate 0.2541865828329001name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.bias lr_decay_rate 0.2824295364810001 name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.bias lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.weight lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.ls1 key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.bias key (0.0, 0.02058911320946491, False, False) name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.bias lr_decay_rate 0.2824295364810001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.weight key (1.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.weight key (1.0, 0.04304672100000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.bias key (0.0, 0.028242953648100012, False, False) name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.bias lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.ls1 key (0.0, 0.02541865828329001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.bias key (0.0, 0.028242953648100012, False, False) name module.module.external_feature_model.vit.decoder.layers.2.ls1 lr_decay_rate 0.09847709021836118_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.bias key (0.0, 0.00984770902183612, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.weight key (1.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.bias key (0.0, 0.028242953648100012, False, False)name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.bias lr_decay_rate 0.2287679245496101 name module.module.external_feature_model.vit.decoder.layers.9.ls2 lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.bias lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.bias key (0.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.weight lr_decay_rate 0.20589113209464907name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.weight lr_decay_rate 0.2824295364810001 name module.module.external_feature_model.vit.decoder.layers.11.ls2 lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.ls1 key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.bias lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.bias key (0.0, 0.02287679245496101, False, False) name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.weight lr_decay_rate 0.09847709021836118_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.ls2 key (0.0, 0.02058911320946491, False, False)name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.weight lr_decay_rate 0.2824295364810001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.bias key (0.0, 0.04304672100000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.weight key (0.0, 0.02058911320946491, False, False) name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.weight lr_decay_rate 0.2824295364810001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.weight key (1.0, 0.028242953648100012, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.bias key (0.0, 0.02541865828329001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.ls2 key (0.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.2.ls2 lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.weight lr_decay_rate 0.2541865828329001name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.weight lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.weight key (1.0, 0.00984770902183612, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.weight key (0.0, 0.028242953648100012, False, False) name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.weight lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.weight lr_decay_rate 0.4304672100000001 name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.bias lr_decay_rate 0.20589113209464907_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.weight key (1.0, 0.028242953648100012, False, False) name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.bias lr_decay_rate 0.2824295364810001name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.weight lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.weight key (1.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.ls2 key (0.0, 0.00984770902183612, False, False)name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.weight lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.weight key (0.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.bias lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.weight key (0.0, 0.02058911320946491, False, False) name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.bias lr_decay_rate 0.09847709021836118_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.weight key (1.0, 0.04304672100000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.bias key (0.0, 0.028242953648100012, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.weight key (0.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.bias key (0.0, 0.02058911320946491, False, False) name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.bias lr_decay_rate 0.2824295364810001 name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.bias lr_decay_rate 0.2287679245496101_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.weight key (0.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.bias lr_decay_rate 0.2541865828329001name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.weight lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.bias key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.bias key (0.0, 0.00984770902183612, False, False)name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.bias lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.bias lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.bias key (0.0, 0.028242953648100012, False, False)name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.bias lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.bias key (0.0, 0.02287679245496101, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.bias key (0.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.weight lr_decay_rate 0.2824295364810001 name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.weight lr_decay_rate 0.20589113209464907name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.bias lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.weight key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.weight lr_decay_rate 0.09847709021836118_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.bias key (0.0, 0.04304672100000001, False, False) name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.weight lr_decay_rate 0.2824295364810001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.bias key (0.0, 0.02058911320946491, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.bias key (0.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.weight lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.weight key (1.0, 0.02058911320946491, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.weight key (0.0, 0.028242953648100012, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.bias key (0.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.weight lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.weight key (1.0, 0.00984770902183612, False, False)name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.bias lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.11.ls1 lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.weight key (1.0, 0.028242953648100012, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.weight key (1.0, 0.028242953648100012, False, False)name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.weight lr_decay_rate 0.4304672100000001 name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.weight lr_decay_rate 0.20589113209464907name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.weight lr_decay_rate 0.2541865828329001name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.bias lr_decay_rate 0.2824295364810001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.bias key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.bias lr_decay_rate 0.20589113209464907_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.weight key (1.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.bias lr_decay_rate 0.2824295364810001name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.bias lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.ls1 key (0.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.weight lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.weight key (0.0, 0.04304672100000001, False, False)name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.bias lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.bias key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.weight key (1.0, 0.02541865828329001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.weight key (1.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.bias key (0.0, 0.02058911320946491, False, False) name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.bias lr_decay_rate 0.2541865828329001name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.weight lr_decay_rate 0.09847709021836118_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.bias key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.bias key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.bias key (0.0, 0.00984770902183612, False, False)name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.bias lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.weight key (1.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.11.ls2 lr_decay_rate 0.2541865828329001name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.bias lr_decay_rate 0.2541865828329001 name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.weight lr_decay_rate 0.2824295364810001 name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.bias lr_decay_rate 0.20589113209464907_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.weight key (1.0, 0.00984770902183612, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.bias key (0.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.weight lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.weight lr_decay_rate 0.2824295364810001name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.weight lr_decay_rate 0.2824295364810001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.bias key (0.0, 0.04304672100000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.bias key (0.0, 0.02541865828329001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.ls2 key (0.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.3.ls1 lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.weight key (1.0, 0.028242953648100012, False, False)name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.bias lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.bias key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.weight key (1.0, 0.02058911320946491, False, False) name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.bias lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.weight lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.weight key (0.0, 0.028242953648100012, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.weight key (1.0, 0.028242953648100012, False, False) name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.weight lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.bias key (0.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.bias lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.ls1 key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.weight lr_decay_rate 0.2541865828329001name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.weight lr_decay_rate 0.2541865828329001 name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.bias lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.weight lr_decay_rate 0.20589113209464907name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.bias lr_decay_rate 0.2824295364810001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.bias key (0.0, 0.028242953648100012, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.bias key (0.0, 0.00984770902183612, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.weight key (1.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.bias lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.weight key (1.0, 0.04304672100000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.weight key (0.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.weight lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.weight key (1.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.3.ls2 lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.bias key (0.0, 0.02058911320946491, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.bias key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.weight key (1.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.bias key (0.0, 0.028242953648100012, False, False)name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.weight lr_decay_rate 0.09847709021836118name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.weight lr_decay_rate 0.2824295364810001 name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.bias lr_decay_rate 0.2541865828329001name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.bias lr_decay_rate 0.4304672100000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.ls2 key (0.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.weight key (1.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.bias lr_decay_rate 0.2541865828329001 name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.bias lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.10.ls1 lr_decay_rate 0.2287679245496101name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.bias lr_decay_rate 0.2541865828329001 name module.module.external_feature_model.vit.decoder.layers.13.ls1 lr_decay_rate 0.31381059609000006_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.weight key (1.0, 0.00984770902183612, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.weight key (1.0, 0.028242953648100012, False, False) name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.weight lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.bias key (0.0, 0.02541865828329001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.bias key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.bias key (0.0, 0.02058911320946491, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.bias key (0.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.bias lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.bias key (0.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.weight lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.ls1 key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.weight key (1.0, 0.028242953648100012, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.ls1 key (0.0, 0.031381059609000006, False, False)name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.bias lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.bias lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.bias key (0.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.weight lr_decay_rate 0.4304672100000001name module.module.external_feature_model.vit.decoder.layers.12.ls1 lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.weight key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.10.ls2 lr_decay_rate 0.2287679245496101 name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.weight lr_decay_rate 0.20589113209464907name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.weight lr_decay_rate 0.2541865828329001name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.weight lr_decay_rate 0.2541865828329001name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.bias lr_decay_rate 0.2824295364810001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.bias key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.bias key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.13.ls2 lr_decay_rate 0.31381059609000006name module.module.external_feature_model.vit.decoder.layers.12.ls1 lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.weight key (1.0, 0.04304672100000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.ls1 key (0.0, 0.028242953648100012, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.ls2 key (0.0, 0.02287679245496101, False, False)name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.bias lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.weight key (0.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.bias key (0.0, 0.028242953648100012, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.weight key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.ls1 key (0.0, 0.028242953648100012, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.weight key (1.0, 0.02541865828329001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.ls2 key (0.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.12.ls2 lr_decay_rate 0.2824295364810001name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.weight lr_decay_rate 0.09847709021836118_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.bias key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.weight lr_decay_rate 0.2287679245496101name module.module.external_feature_model.vit.decoder.layers.13.ls1 lr_decay_rate 0.31381059609000006 name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.bias lr_decay_rate 0.4304672100000001 name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.bias lr_decay_rate 0.2541865828329001 name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.bias lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.weight lr_decay_rate 0.2824295364810001 name module.module.external_feature_model.vit.decoder.layers.12.ls2 lr_decay_rate 0.2824295364810001 name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.weight lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.weight key (0.0, 0.02287679245496101, False, False)name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.bias lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.weight key (0.0, 0.00984770902183612, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.ls2 key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.bias key (0.0, 0.04304672100000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.ls1 key (0.0, 0.031381059609000006, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.bias key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.bias key (0.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.weight lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.ls2 key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.weight key (1.0, 0.028242953648100012, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.weight key (0.0, 0.031381059609000006, False, False)name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.bias lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.bias key (0.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.17.ls1 lr_decay_rate 0.4782969000000001name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.bias lr_decay_rate 0.2287679245496101 name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.weight lr_decay_rate 0.2824295364810001name module.module.external_feature_model.vit.decoder.layers.13.ls2 lr_decay_rate 0.31381059609000006_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.bias key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.weight lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.weight key (1.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.bias lr_decay_rate 0.31381059609000006name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.bias lr_decay_rate 0.2824295364810001name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.weight lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.bias key (0.0, 0.02287679245496101, False, False)name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.weight lr_decay_rate 0.20589113209464907name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.weight lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.ls2 key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.ls1 key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.weight key (0.0, 0.028242953648100012, False, False)name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.weight lr_decay_rate 0.09847709021836118_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.weight key (0.0, 0.028242953648100012, False, False) name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.bias lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.bias key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.weight key (1.0, 0.02541865828329001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.bias key (0.0, 0.028242953648100012, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.weight key (1.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.17.ls2 lr_decay_rate 0.4782969000000001name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.weight lr_decay_rate 0.2287679245496101 name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.bias lr_decay_rate 0.2824295364810001 name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.weight lr_decay_rate 0.31381059609000006_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.weight key (1.0, 0.00984770902183612, False, False)name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.bias lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.weight key (1.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.bias key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.bias lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.ls2 key (0.0, 0.04782969000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.weight key (1.0, 0.02287679245496101, False, False) name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.bias lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.bias key (0.0, 0.028242953648100012, False, False) name module.module.external_feature_model.vit.decoder.layers.13.ls1 lr_decay_rate 0.31381059609000006name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.weight lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.bias key (0.0, 0.028242953648100012, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.weight key (0.0, 0.031381059609000006, False, False)name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.bias lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.bias key (0.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.weight lr_decay_rate 0.10941898913151242name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.bias lr_decay_rate 0.2287679245496101name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.bias lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.bias key (0.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.ls1 key (0.0, 0.031381059609000006, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.weight key (1.0, 0.031381059609000006, False, False)name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.bias lr_decay_rate 0.31381059609000006name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.weight lr_decay_rate 0.4782969000000001 name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.weight lr_decay_rate 0.2824295364810001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.bias key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.weight lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.weight key (1.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.weight lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.bias key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.bias key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.bias key (0.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.13.ls2 lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.weight key (0.0, 0.04782969000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.bias lr_decay_rate 0.31381059609000006 name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.weight lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.weight key (0.0, 0.02541865828329001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.weight key (1.0, 0.028242953648100012, False, False) name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.weight lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.bias lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.weight key (1.0, 0.028242953648100012, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.ls2 key (0.0, 0.031381059609000006, False, False)name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.weight lr_decay_rate 0.2287679245496101 name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.weight lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.bias lr_decay_rate 0.4782969000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.weight key (1.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.weight key (1.0, 0.00984770902183612, False, False)name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.weight lr_decay_rate 0.31381059609000006_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.bias key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.bias lr_decay_rate 0.2824295364810001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.bias key (0.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.bias lr_decay_rate 0.2541865828329001name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.bias lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.weight key (1.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.weight key (1.0, 0.02287679245496101, False, False) name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.weight lr_decay_rate 0.31381059609000006_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.bias key (0.0, 0.04782969000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.bias lr_decay_rate 0.2541865828329001 name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.bias lr_decay_rate 0.09847709021836118_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.weight key (1.0, 0.031381059609000006, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.bias key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.bias key (0.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.weight lr_decay_rate 0.10941898913151242 name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.bias lr_decay_rate 0.20589113209464907name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.weight lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.bias key (0.0, 0.028242953648100012, False, False) name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.bias lr_decay_rate 0.2287679245496101_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.bias key (0.0, 0.00984770902183612, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.weight key (0.0, 0.031381059609000006, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.bias key (0.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.weight lr_decay_rate 0.2824295364810001 name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.bias lr_decay_rate 0.31381059609000006name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.weight lr_decay_rate 0.4782969000000001 name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.weight lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.weight key (0.0, 0.010941898913151242, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.bias key (0.0, 0.02058911320946491, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.weight key (1.0, 0.031381059609000006, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.bias key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.weight key (1.0, 0.028242953648100012, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.bias key (0.0, 0.031381059609000006, False, False)name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.weight lr_decay_rate 0.2824295364810001 name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.bias lr_decay_rate 0.31381059609000006name module.module.external_feature_model.vit.decoder.layers.3.ls1 lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.weight key (1.0, 0.04782969000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.12.ls1 lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.weight key (1.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.10.ls1 lr_decay_rate 0.2287679245496101name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.bias lr_decay_rate 0.10941898913151242 name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.bias lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.ls1 key (0.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.bias key (0.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.bias lr_decay_rate 0.2824295364810001name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.weight lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.weight key (1.0, 0.028242953648100012, False, False)name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.weight lr_decay_rate 0.2287679245496101 name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.bias lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.ls1 key (0.0, 0.028242953648100012, False, False)name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.bias lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.bias key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.ls1 key (0.0, 0.02287679245496101, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.bias key (0.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.bias key (0.0, 0.028242953648100012, False, False)name module.module.external_feature_model.vit.decoder.layers.3.ls2 lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.weight key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.bias key (0.0, 0.04782969000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.bias lr_decay_rate 0.2824295364810001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.weight key (1.0, 0.031381059609000006, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.bias key (0.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.weight lr_decay_rate 0.31381059609000006 name module.module.external_feature_model.vit.decoder.layers.12.ls2 lr_decay_rate 0.2824295364810001name module.module.external_feature_model.vit.decoder.layers.10.ls2 lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.ls2 key (0.0, 0.010941898913151242, False, False)name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.weight lr_decay_rate 0.10941898913151242name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.weight lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.bias key (0.0, 0.028242953648100012, False, False) name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.bias lr_decay_rate 0.2287679245496101 name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.weight lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.ls2 key (0.0, 0.028242953648100012, False, False) name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.weight lr_decay_rate 0.2824295364810001name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.bias lr_decay_rate 0.31381059609000006name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.weight lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.weight key (1.0, 0.031381059609000006, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.ls2 key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.weight key (1.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.weight key (0.0, 0.031381059609000006, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.bias key (0.0, 0.02287679245496101, False, False) name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.weight lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.weight key (1.0, 0.04782969000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.weight lr_decay_rate 0.2824295364810001name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.weight lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.weight key (0.0, 0.028242953648100012, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.weight key (1.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.bias lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.bias key (0.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.bias lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.weight key (0.0, 0.010941898913151242, False, False)name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.weight lr_decay_rate 0.2287679245496101name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.bias lr_decay_rate 0.31381059609000006name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.weight lr_decay_rate 0.2287679245496101_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.weight key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.weight key (0.0, 0.028242953648100012, False, False) name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.bias lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.bias key (0.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.bias lr_decay_rate 0.2824295364810001name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.bias lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.bias key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.bias lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.weight key (0.0, 0.02287679245496101, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.bias key (0.0, 0.031381059609000006, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.weight key (1.0, 0.02287679245496101, False, False) name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.bias lr_decay_rate 0.2824295364810001 name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.weight lr_decay_rate 0.31381059609000006_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.bias key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.bias key (0.0, 0.028242953648100012, False, False)name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.bias lr_decay_rate 0.2824295364810001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.bias key (0.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.weight lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.bias key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.weight lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.bias key (0.0, 0.028242953648100012, False, False)name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.bias lr_decay_rate 0.2287679245496101name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.weight lr_decay_rate 0.31381059609000006 name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.bias lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.weight key (0.0, 0.031381059609000006, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.bias key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.weight key (1.0, 0.031381059609000006, False, False)name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.weight lr_decay_rate 0.2824295364810001 name module.module.external_feature_model.vit.decoder.layers.12.ls1 lr_decay_rate 0.2824295364810001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.weight key (1.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.bias key (0.0, 0.02287679245496101, False, False)name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.weight lr_decay_rate 0.4782969000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.bias key (0.0, 0.02287679245496101, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.weight key (1.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.weight lr_decay_rate 0.10941898913151242 name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.weight lr_decay_rate 0.2824295364810001name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.bias lr_decay_rate 0.31381059609000006name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.bias lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.weight key (1.0, 0.028242953648100012, False, False) name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.weight lr_decay_rate 0.2824295364810001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.weight key (0.0, 0.04782969000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.ls1 key (0.0, 0.028242953648100012, False, False) name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.bias lr_decay_rate 0.10941898913151242 name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.bias lr_decay_rate 0.31381059609000006name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.weight lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.weight key (1.0, 0.010941898913151242, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.bias key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.weight key (1.0, 0.028242953648100012, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.bias key (0.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.weight lr_decay_rate 0.2287679245496101 name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.bias lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.weight key (1.0, 0.028242953648100012, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.bias key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.bias lr_decay_rate 0.4782969000000001 name module.module.external_feature_model.vit.decoder.layers.12.ls2 lr_decay_rate 0.2824295364810001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.bias key (0.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.bias lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.weight key (1.0, 0.02287679245496101, False, False) name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.weight lr_decay_rate 0.31381059609000006 name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.bias lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.bias key (0.0, 0.028242953648100012, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.weight key (1.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.ls2 key (0.0, 0.028242953648100012, False, False)name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.weight lr_decay_rate 0.31381059609000006_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.bias key (0.0, 0.04782969000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.bias lr_decay_rate 0.2824295364810001name module.module.external_feature_model.vit.decoder.layers.4.ls1 lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.bias key (0.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.bias key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.weight key (1.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.bias lr_decay_rate 0.2287679245496101name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.weight lr_decay_rate 0.31381059609000006 name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.weight lr_decay_rate 0.2824295364810001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.weight key (0.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.weight lr_decay_rate 0.2824295364810001 name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.bias lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.bias key (0.0, 0.028242953648100012, False, False)name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.weight lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.ls1 key (0.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.bias key (0.0, 0.02287679245496101, False, False) name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.weight lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.weight key (1.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.bias lr_decay_rate 0.31381059609000006 name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.weight lr_decay_rate 0.2824295364810001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.weight key (1.0, 0.028242953648100012, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.weight key (0.0, 0.028242953648100012, False, False) name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.bias lr_decay_rate 0.31381059609000006_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.bias key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.weight key (1.0, 0.04782969000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.4.ls2 lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.weight key (1.0, 0.010941898913151242, False, False)name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.weight lr_decay_rate 0.2824295364810001 name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.bias lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.bias key (0.0, 0.031381059609000006, False, False)name module.module.external_feature_model.vit.decoder.layers.11.ls1 lr_decay_rate 0.2541865828329001name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.bias lr_decay_rate 0.2824295364810001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.weight key (1.0, 0.028242953648100012, False, False)name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.bias lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.bias key (0.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.bias lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.ls2 key (0.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.weight lr_decay_rate 0.2287679245496101_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.weight key (1.0, 0.028242953648100012, False, False)name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.bias lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.ls1 key (0.0, 0.02541865828329001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.bias key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.bias key (0.0, 0.028242953648100012, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.bias key (0.0, 0.028242953648100012, False, False)name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.bias lr_decay_rate 0.2824295364810001 name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.weight lr_decay_rate 0.31381059609000006 name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.weight lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.bias key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.weight key (1.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.bias key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.weight lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.bias lr_decay_rate 0.2824295364810001 name module.module.external_feature_model.vit.decoder.layers.11.ls2 lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.bias key (0.0, 0.028242953648100012, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.weight key (1.0, 0.031381059609000006, False, False)name module.module.external_feature_model.vit.decoder.layers.13.ls1 lr_decay_rate 0.31381059609000006_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.weight key (1.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.weight lr_decay_rate 0.2824295364810001 name module.module.external_feature_model.vit.decoder.layers.14.ls1 lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.weight key (0.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.weight lr_decay_rate 0.4782969000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.bias key (0.0, 0.028242953648100012, False, False) name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.weight lr_decay_rate 0.10941898913151242name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.bias lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.ls2 key (0.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.bias lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.ls1 key (0.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.bias lr_decay_rate 0.31381059609000006_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.weight key (1.0, 0.028242953648100012, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.ls1 key (0.0, 0.03486784401000001, False, False)name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.weight lr_decay_rate 0.2824295364810001 name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.bias lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.weight key (1.0, 0.04782969000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.bias key (0.0, 0.031381059609000006, False, False)name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.weight lr_decay_rate 0.2541865828329001name module.module.external_feature_model.vit.decoder.layers.13.ls1 lr_decay_rate 0.31381059609000006_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.weight key (0.0, 0.010941898913151242, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.bias key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.bias key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.weight key (0.0, 0.028242953648100012, False, False)name module.module.external_feature_model.vit.decoder.layers.14.ls2 lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.bias lr_decay_rate 0.2824295364810001name module.module.external_feature_model.vit.decoder.layers.13.ls2 lr_decay_rate 0.31381059609000006_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.bias key (0.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.bias lr_decay_rate 0.4782969000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.weight key (0.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.ls1 key (0.0, 0.031381059609000006, False, False)name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.bias lr_decay_rate 0.10941898913151242name module.module.external_feature_model.vit.decoder.layers.14.ls1 lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.weight lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.ls2 key (0.0, 0.03486784401000001, False, False)name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.bias lr_decay_rate 0.2824295364810001name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.weight lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.bias key (0.0, 0.04782969000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.ls2 key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.bias key (0.0, 0.028242953648100012, False, False) name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.bias lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.bias key (0.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.ls1 key (0.0, 0.03486784401000001, False, False)name module.module.external_feature_model.vit.decoder.layers.13.ls2 lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.weight key (1.0, 0.031381059609000006, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.bias key (0.0, 0.028242953648100012, False, False) name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.weight lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.weight key (0.0, 0.02287679245496101, False, False)name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.weight lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.18.ls1 lr_decay_rate 0.531441 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.bias key (0.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.weight lr_decay_rate 0.2824295364810001name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.weight lr_decay_rate 0.31381059609000006name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.bias lr_decay_rate 0.31381059609000006_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.ls2 key (0.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.14.ls2 lr_decay_rate 0.3486784401000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.weight key (1.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.weight lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.weight key (0.0, 0.03486784401000001, False, False) name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.weight lr_decay_rate 0.2824295364810001name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.bias lr_decay_rate 0.2287679245496101_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.ls1 key (0.0, 0.05314410000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.bias key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.weight key (0.0, 0.031381059609000006, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.weight key (1.0, 0.028242953648100012, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.ls2 key (0.0, 0.03486784401000001, False, False) name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.weight lr_decay_rate 0.31381059609000006name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.weight lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.weight key (1.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.bias lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.weight key (1.0, 0.028242953648100012, False, False) name module.module.external_feature_model.vit.decoder.layers.18.ls2 lr_decay_rate 0.531441name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.bias lr_decay_rate 0.3486784401000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.bias key (0.0, 0.02287679245496101, False, False)name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.bias lr_decay_rate 0.2824295364810001 name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.bias lr_decay_rate 0.31381059609000006 name module.module.external_feature_model.vit.decoder.layers.14.ls1 lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.weight lr_decay_rate 0.3486784401000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.weight key (1.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.weight key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.bias key (0.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.bias key (0.0, 0.03486784401000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.bias key (0.0, 0.028242953648100012, False, False)name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.bias lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.ls2 key (0.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.bias lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.bias key (0.0, 0.031381059609000006, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.weight key (0.0, 0.03486784401000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.ls1 key (0.0, 0.03486784401000001, False, False)name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.bias lr_decay_rate 0.2541865828329001 name module.module.external_feature_model.vit.class_token lr_decay_rate 1.0name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.weight lr_decay_rate 0.2287679245496101name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.bias lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.bias key (0.0, 0.028242953648100012, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.bias key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.weight lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.weight lr_decay_rate 0.531441 name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.bias lr_decay_rate 0.3486784401000001name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.weight lr_decay_rate 0.3486784401000001name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.weight lr_decay_rate 0.2824295364810001 name module.module.external_feature_model.vit.decoder.layers.14.ls2 lr_decay_rate 0.3486784401000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.bias key (0.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.weight lr_decay_rate 0.31381059609000006_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.bias key (0.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.weight key (1.0, 0.02287679245496101, False, False) name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.weight lr_decay_rate 0.2824295364810001name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.weight lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.weight key (0.0, 0.05314410000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.weight key (1.0, 0.012157665459056936, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.bias key (0.0, 0.03486784401000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.ls2 key (0.0, 0.03486784401000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.weight key (0.0, 0.028242953648100012, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.weight key (1.0, 0.03486784401000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.weight key (1.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.bias lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.weight key (1.0, 0.028242953648100012, False, False)name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.weight lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.weight key (1.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.bias lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.bias lr_decay_rate 0.531441 name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.weight lr_decay_rate 0.31381059609000006 name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.bias lr_decay_rate 0.2824295364810001 name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.weight lr_decay_rate 0.3486784401000001name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.bias lr_decay_rate 0.3486784401000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.bias key (0.0, 0.02287679245496101, False, False)name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.weight lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.bias lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.weight key (1.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.bias lr_decay_rate 0.10941898913151242name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.bias lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.bias key (0.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.bias key (0.0, 0.05314410000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.bias key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.weight key (1.0, 0.031381059609000006, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.weight key (0.0, 0.03486784401000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.bias key (0.0, 0.010941898913151242, False, False)name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.weight lr_decay_rate 0.2287679245496101_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.bias key (0.0, 0.03486784401000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.weight key (1.0, 0.03486784401000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.bias key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.bias key (0.0, 0.028242953648100012, False, False) name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.bias lr_decay_rate 0.2541865828329001 name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.weight lr_decay_rate 0.531441 name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.weight lr_decay_rate 0.2824295364810001name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.bias lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.weight key (1.0, 0.02287679245496101, False, False)name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.weight lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.bias lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.4.ls1 lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.bias key (0.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.weight lr_decay_rate 0.31381059609000006 name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.weight lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.bias lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.weight key (1.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.13.ls1 lr_decay_rate 0.31381059609000006_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.weight key (1.0, 0.028242953648100012, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.bias key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.weight key (1.0, 0.031381059609000006, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.weight key (0.0, 0.012157665459056936, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.bias key (0.0, 0.03486784401000001, False, False) name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.bias lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.ls1 key (0.0, 0.012157665459056936, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.weight key (1.0, 0.03486784401000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.bias key (0.0, 0.03486784401000001, False, False)name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.weight lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.ls1 key (0.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.bias lr_decay_rate 0.531441name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.bias lr_decay_rate 0.2824295364810001 name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.bias lr_decay_rate 0.31381059609000006name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.weight lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.bias key (0.0, 0.02287679245496101, False, False)name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.bias lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.bias lr_decay_rate 0.3486784401000001name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.weight lr_decay_rate 0.3486784401000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.weight key (0.0, 0.02541865828329001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.bias key (0.0, 0.05314410000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.4.ls2 lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.weight lr_decay_rate 0.3486784401000001name module.module.external_feature_model.vit.decoder.layers.13.ls2 lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.bias key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.bias key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.weight key (1.0, 0.031381059609000006, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.bias key (0.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.bias key (0.0, 0.03486784401000001, False, False)name module.module.external_feature_model.vit.decoder.layers.11.ls1 lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.weight key (1.0, 0.03486784401000001, False, False)name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.bias lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.ls2 key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.ls2 key (0.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.weight lr_decay_rate 0.531441_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.weight key (1.0, 0.03486784401000001, False, False) name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.bias lr_decay_rate 0.31381059609000006name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.weight lr_decay_rate 0.2824295364810001 name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.weight lr_decay_rate 0.31381059609000006name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.weight lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.external_feature_model.vit.class_token key (1.0, 0.1, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.ls1 key (0.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.bias lr_decay_rate 0.3486784401000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.bias key (0.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.weight key (1.0, 0.05314410000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.weight lr_decay_rate 0.3486784401000001name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.bias lr_decay_rate 0.3486784401000001name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.weight lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.bias key (0.0, 0.031381059609000006, False, False)name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.weight lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.weight key (1.0, 0.028242953648100012, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.weight key (1.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.weight key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.bias key (0.0, 0.03486784401000001, False, False) name module.module.external_feature_model.vit.decoder.layers.11.ls2 lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.bias key (0.0, 0.03486784401000001, False, False)name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.weight lr_decay_rate 0.2541865828329001 name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.bias lr_decay_rate 0.531441 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.weight key (0.0, 0.031381059609000006, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.weight key (0.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.weight key (0.0, 0.03486784401000001, False, False) name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.bias lr_decay_rate 0.2824295364810001name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.weight lr_decay_rate 0.3486784401000001name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.bias lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.bias lr_decay_rate 0.31381059609000006_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.ls2 key (0.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.weight lr_decay_rate 0.31381059609000006_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.weight key (1.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.conv1.weight lr_decay_rate 0.0717897987691853 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.bias key (0.0, 0.05314410000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.bias lr_decay_rate 0.31381059609000006name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.bias lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.bias lr_decay_rate 0.3486784401000001name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.weight lr_decay_rate 0.3486784401000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.bias key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.bias key (0.0, 0.031381059609000006, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.weight key (1.0, 0.03486784401000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.bias key (0.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.weight key (0.0, 0.031381059609000006, False, False)name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.weight lr_decay_rate 0.2541865828329001name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.bias lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.bias key (0.0, 0.031381059609000006, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.bias key (0.0, 0.03486784401000001, False, False)_get_param_groups name module.module.external_feature_model.vit.conv1.weight key (1.0, 0.00717897987691853, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.bias key (0.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.weight key (0.0, 0.03486784401000001, False, False)name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.weight lr_decay_rate 0.531441 name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.bias lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.bias key (0.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.13.ls1 lr_decay_rate 0.31381059609000006 name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.weight lr_decay_rate 0.31381059609000006name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.weight lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.weight key (0.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.bias lr_decay_rate 0.31381059609000006 name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.bias lr_decay_rate 0.3486784401000001name module.module.external_feature_model.vit.conv1.bias lr_decay_rate 0.0717897987691853name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.weight lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.weight key (0.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.weight lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.bias key (0.0, 0.03486784401000001, False, False) name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.weight lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.weight key (1.0, 0.031381059609000006, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.ls1 key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.weight key (1.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.weight lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.bias key (0.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.bias lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.bias key (0.0, 0.03486784401000001, False, False) _get_param_groups name module.module.external_feature_model.vit.conv1.bias key (0.0, 0.00717897987691853, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.weight key (1.0, 0.031381059609000006, False, False)name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.bias lr_decay_rate 0.531441_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.weight key (1.0, 0.03486784401000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.weight key (1.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.weight lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.bias key (0.0, 0.02541865828329001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.weight key (1.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.13.ls2 lr_decay_rate 0.31381059609000006 name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.bias lr_decay_rate 0.31381059609000006 name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.bias lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.bias key (0.0, 0.05314410000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.weight lr_decay_rate 0.31381059609000006name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.weight lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.bias lr_decay_rate 0.31381059609000006 name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.bias lr_decay_rate 0.3486784401000001name module.module.external_feature_model.vit.position_embeddings.weight lr_decay_rate 0.0717897987691853 name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.bias lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.weight key (0.0, 0.03486784401000001, False, False) name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.bias lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.bias key (0.0, 0.031381059609000006, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.bias key (0.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.ls2 key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.weight key (1.0, 0.03486784401000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.weight key (1.0, 0.031381059609000006, False, False)name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.weight lr_decay_rate 0.2541865828329001name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.weight lr_decay_rate 0.531441_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.bias key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.bias key (0.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.bias key (0.0, 0.03486784401000001, False, False) _get_param_groups name module.module.external_feature_model.vit.position_embeddings.weight key (1.0, 0.00717897987691853, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.bias key (0.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.weight lr_decay_rate 0.31381059609000006 name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.bias lr_decay_rate 0.3486784401000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.weight key (1.0, 0.05314410000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.weight lr_decay_rate 0.31381059609000006name module.module.external_feature_model.vit.decoder.layers.5.ls1 lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.bias lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.bias lr_decay_rate 0.31381059609000006_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.weight key (1.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.weight key (1.0, 0.031381059609000006, False, False)name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.weight lr_decay_rate 0.31381059609000006 name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.weight lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.bias key (0.0, 0.03486784401000001, False, False) name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.weight lr_decay_rate 0.3486784401000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.weight key (0.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.12.ls1 lr_decay_rate 0.2824295364810001 name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.bias lr_decay_rate 0.531441_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.bias key (0.0, 0.03486784401000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.bias key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.ls1 key (0.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.bias lr_decay_rate 0.31381059609000006 name module.module.external_feature_model.vit.decoder.layers.0.ls1 lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.weight key (1.0, 0.031381059609000006, False, False)name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.bias lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.weight key (1.0, 0.03486784401000001, False, False)name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.bias lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.weight key (1.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.bias key (0.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.weight lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.weight lr_decay_rate 0.3486784401000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.ls1 key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.bias key (0.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.weight lr_decay_rate 0.31381059609000006 name module.module.external_feature_model.vit.decoder.layers.5.ls2 lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.bias key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.bias key (0.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.bias lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.bias lr_decay_rate 0.31381059609000006 name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.bias lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.ls1 key (0.0, 0.007976644307687256, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.weight key (1.0, 0.03486784401000001, False, False) name module.module.external_feature_model.vit.decoder.layers.12.ls2 lr_decay_rate 0.2824295364810001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.weight key (1.0, 0.03486784401000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.ls2 key (0.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.weight lr_decay_rate 0.531441_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.weight key (1.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.14.ls1 lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.bias key (0.0, 0.03486784401000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.bias key (0.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.weight lr_decay_rate 0.31381059609000006name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.weight lr_decay_rate 0.2541865828329001 name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.bias lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.bias key (0.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.bias lr_decay_rate 0.3486784401000001name module.module.external_feature_model.vit.decoder.layers.0.ls2 lr_decay_rate 0.07976644307687256_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.ls2 key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.weight key (1.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.bias lr_decay_rate 0.31381059609000006 name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.weight lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.ls1 key (0.0, 0.03486784401000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.weight key (1.0, 0.031381059609000006, False, False)name module.module.external_feature_model.vit.decoder.layers.15.ls1 lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.weight key (1.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.bias key (0.0, 0.03486784401000001, False, False) name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.weight lr_decay_rate 0.31381059609000006_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.bias key (0.0, 0.03486784401000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.bias key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.ls2 key (0.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.weight key (0.0, 0.013508517176729929, False, False)name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.weight lr_decay_rate 0.2824295364810001 name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.bias lr_decay_rate 0.531441 name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.weight lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.ls1 key (0.0, 0.03874204890000001, False, False)name module.module.external_feature_model.vit.decoder.layers.14.ls2 lr_decay_rate 0.3486784401000001name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.bias lr_decay_rate 0.31381059609000006 name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.bias lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.weight key (0.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.weight lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.bias key (0.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.14.ls1 lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.15.ls1 lr_decay_rate 0.3874204890000001name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.bias lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.weight key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.ls2 key (0.0, 0.03486784401000001, False, False)name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.weight lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.bias key (0.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.weight key (0.0, 0.012157665459056936, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.bias key (0.0, 0.031381059609000006, False, False)name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.bias lr_decay_rate 0.31381059609000006name module.module.external_feature_model.vit.decoder.layers.15.ls2 lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.weight key (1.0, 0.03486784401000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.bias key (0.0, 0.013508517176729929, False, False)name module.module.external_feature_model.vit.decoder.layers.19.ls1 lr_decay_rate 0.5904900000000001name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.bias lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.ls1 key (0.0, 0.03486784401000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.ls1 key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.ls2 key (0.0, 0.03874204890000001, False, False)name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.bias lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.weight key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.weight lr_decay_rate 0.3486784401000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.bias key (0.0, 0.031381059609000006, False, False)name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.weight lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.bias key (0.0, 0.028242953648100012, False, False)name module.module.external_feature_model.vit.decoder.layers.14.ls2 lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.bias lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.weight lr_decay_rate 0.31381059609000006_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.ls1 key (0.0, 0.05904900000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.weight lr_decay_rate 0.13508517176729928name module.module.external_feature_model.vit.decoder.layers.15.ls2 lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.bias key (0.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.weight lr_decay_rate 0.3874204890000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.weight key (0.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.bias key (0.0, 0.03486784401000001, False, False)name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.weight lr_decay_rate 0.31381059609000006name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.bias lr_decay_rate 0.07976644307687256_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.weight key (0.0, 0.03486784401000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.ls2 key (0.0, 0.03486784401000001, False, False)name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.weight lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.weight key (1.0, 0.013508517176729929, False, False)name module.module.external_feature_model.vit.decoder.layers.19.ls2 lr_decay_rate 0.5904900000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.ls2 key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.weight key (1.0, 0.031381059609000006, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.weight key (0.0, 0.03874204890000001, False, False) name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.weight lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.weight key (1.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.bias lr_decay_rate 0.3486784401000001name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.bias lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.bias key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.15.ls1 lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.weight key (1.0, 0.028242953648100012, False, False) name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.weight lr_decay_rate 0.3486784401000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.ls2 key (0.0, 0.05904900000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.bias lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.weight lr_decay_rate 0.3874204890000001 name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.bias lr_decay_rate 0.3874204890000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.weight key (1.0, 0.012157665459056936, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.bias key (0.0, 0.03486784401000001, False, False)name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.bias lr_decay_rate 0.31381059609000006name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.bias lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.bias key (0.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.weight key (0.0, 0.03486784401000001, False, False) name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.weight lr_decay_rate 0.07976644307687256_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.ls1 key (0.0, 0.03874204890000001, False, False) name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.bias lr_decay_rate 0.2824295364810001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.weight key (0.0, 0.03874204890000001, False, False)name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.weight lr_decay_rate 0.5904900000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.bias key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.bias key (0.0, 0.013508517176729929, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.bias key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.bias key (0.0, 0.031381059609000006, False, False)name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.bias lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.bias lr_decay_rate 0.3486784401000001name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.weight lr_decay_rate 0.2541865828329001name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.weight lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.15.ls2 lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.weight key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.weight key (1.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.bias key (0.0, 0.028242953648100012, False, False)name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.bias lr_decay_rate 0.3874204890000001 name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.weight lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.bias key (0.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.bias key (0.0, 0.03486784401000001, False, False)name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.weight lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.weight key (1.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.weight lr_decay_rate 0.3874204890000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.ls2 key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.weight key (1.0, 0.03486784401000001, False, False)name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.weight lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.weight key (1.0, 0.013508517176729929, False, False)name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.bias lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.bias key (0.0, 0.03874204890000001, False, False) name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.weight lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.weight lr_decay_rate 0.2824295364810001 name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.bias lr_decay_rate 0.07976644307687256_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.weight key (1.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.bias lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.weight key (1.0, 0.03874204890000001, False, False) name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.weight lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.weight key (1.0, 0.012157665459056936, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.bias key (0.0, 0.05904900000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.weight key (0.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.weight lr_decay_rate 0.3874204890000001name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.bias lr_decay_rate 0.13508517176729928name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.bias lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.weight key (1.0, 0.028242953648100012, False, False) name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.bias lr_decay_rate 0.31381059609000006_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.bias key (0.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.weight lr_decay_rate 0.3874204890000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.bias key (0.0, 0.007976644307687256, False, False)name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.bias lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.bias lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.weight key (1.0, 0.03486784401000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.bias key (0.0, 0.013508517176729929, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.bias key (0.0, 0.03486784401000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.weight key (0.0, 0.03874204890000001, False, False)name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.bias lr_decay_rate 0.31381059609000006 name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.bias lr_decay_rate 0.2824295364810001name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.weight lr_decay_rate 0.5904900000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.bias key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.weight key (1.0, 0.03874204890000001, False, False)name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.weight lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.bias key (0.0, 0.03874204890000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.bias key (0.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.bias lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.bias lr_decay_rate 0.3874204890000001 name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.weight lr_decay_rate 0.3486784401000001name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.weight lr_decay_rate 0.07976644307687256_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.bias key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.bias key (0.0, 0.028242953648100012, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.weight key (1.0, 0.05904900000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.weight lr_decay_rate 0.13508517176729928name module.module.external_feature_model.vit.decoder.layers.14.ls1 lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.bias lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.weight key (1.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.bias key (0.0, 0.03486784401000001, False, False)name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.weight lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.bias key (0.0, 0.03874204890000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.weight key (1.0, 0.03486784401000001, False, False)name module.module.external_feature_model.vit.decoder.layers.5.ls1 lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.weight key (1.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.ls1 key (0.0, 0.03486784401000001, False, False)name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.weight lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.bias key (0.0, 0.03874204890000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.weight key (0.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.weight lr_decay_rate 0.2824295364810001name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.bias lr_decay_rate 0.5904900000000001 name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.bias lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.weight key (1.0, 0.03874204890000001, False, False)name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.weight lr_decay_rate 0.3486784401000001name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.bias lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.ls1 key (0.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.14.ls2 lr_decay_rate 0.3486784401000001name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.bias lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.bias key (0.0, 0.05904900000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.weight key (1.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.weight lr_decay_rate 0.3874204890000001 name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.weight lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.bias key (0.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.weight key (0.0, 0.028242953648100012, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.bias key (0.0, 0.03486784401000001, False, False)name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.bias lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.bias lr_decay_rate 0.3874204890000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.weight key (1.0, 0.03486784401000001, False, False) name module.module.external_feature_model.vit.decoder.layers.5.ls2 lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.ls2 key (0.0, 0.03486784401000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.bias key (0.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.weight key (1.0, 0.03874204890000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.weight key (1.0, 0.03874204890000001, False, False)name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.weight lr_decay_rate 0.5904900000000001 name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.bias lr_decay_rate 0.31381059609000006 name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.bias lr_decay_rate 0.2824295364810001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.bias key (0.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.12.ls1 lr_decay_rate 0.2824295364810001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.bias key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.ls2 key (0.0, 0.013508517176729929, False, False)name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.weight lr_decay_rate 0.3486784401000001name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.bias lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.weight lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.weight key (1.0, 0.05904900000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.bias key (0.0, 0.031381059609000006, False, False)name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.bias lr_decay_rate 0.3874204890000001 name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.bias lr_decay_rate 0.3874204890000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.bias key (0.0, 0.028242953648100012, False, False) name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.weight lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.weight lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.weight key (0.0, 0.03486784401000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.weight key (0.0, 0.03486784401000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.ls1 key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.bias key (0.0, 0.03486784401000001, False, False) name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.weight lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.weight lr_decay_rate 0.3874204890000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.bias key (0.0, 0.03874204890000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.bias key (0.0, 0.03874204890000001, False, False)name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.bias lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.weight key (0.0, 0.007976644307687256, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.weight key (1.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.weight lr_decay_rate 0.31381059609000006 name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.weight lr_decay_rate 0.2824295364810001 name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.bias lr_decay_rate 0.3486784401000001name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.bias lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.12.ls2 lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.weight key (0.0, 0.013508517176729929, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.weight key (0.0, 0.03874204890000001, False, False)name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.bias lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.weight lr_decay_rate 0.3486784401000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.bias key (0.0, 0.05904900000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.weight key (1.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.bias lr_decay_rate 0.13508517176729928name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.weight lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.bias key (0.0, 0.03486784401000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.weight key (1.0, 0.028242953648100012, False, False) name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.weight lr_decay_rate 0.3874204890000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.bias key (0.0, 0.03486784401000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.bias key (0.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.ls2 key (0.0, 0.028242953648100012, False, False) name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.bias lr_decay_rate 0.13508517176729928name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.bias lr_decay_rate 0.3874204890000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.weight key (0.0, 0.03486784401000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.bias key (0.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.bias lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.weight key (1.0, 0.03874204890000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.weight key (0.0, 0.03874204890000001, False, False) name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.bias lr_decay_rate 0.2824295364810001name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.weight lr_decay_rate 0.5904900000000001 name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.weight lr_decay_rate 0.3486784401000001name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.weight lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.bias key (0.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.weight lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.bias lr_decay_rate 0.3486784401000001name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.weight lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.bias key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.bias key (0.0, 0.031381059609000006, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.weight key (0.0, 0.05904900000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.weight lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.weight key (1.0, 0.03486784401000001, False, False)name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.bias lr_decay_rate 0.3874204890000001name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.bias lr_decay_rate 0.3874204890000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.bias key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.weight key (1.0, 0.03486784401000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.bias key (0.0, 0.03486784401000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.weight key (1.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.weight lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.weight key (1.0, 0.007976644307687256, False, False)name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.bias lr_decay_rate 0.5904900000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.bias key (0.0, 0.03874204890000001, False, False) name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.bias lr_decay_rate 0.3486784401000001name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.weight lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.bias key (0.0, 0.03874204890000001, False, False)name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.weight lr_decay_rate 0.3874204890000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.weight key (0.0, 0.028242953648100012, False, False)name module.module.external_feature_model.vit.decoder.layers.14.ls1 lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.bias lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.bias lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.bias lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.weight key (1.0, 0.013508517176729929, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.bias key (0.0, 0.05904900000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.weight lr_decay_rate 0.3874204890000001name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.weight lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.weight key (1.0, 0.028242953648100012, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.bias key (0.0, 0.03486784401000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.weight key (1.0, 0.03874204890000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.ls1 key (0.0, 0.03486784401000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.bias key (0.0, 0.013508517176729929, False, False)name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.weight lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.bias key (0.0, 0.03486784401000001, False, False) name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.bias lr_decay_rate 0.2824295364810001name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.bias lr_decay_rate 0.13508517176729928name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.weight lr_decay_rate 0.5904900000000001 name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.weight lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.bias key (0.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.weight key (1.0, 0.03874204890000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.weight key (1.0, 0.03486784401000001, False, False) name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.bias lr_decay_rate 0.2824295364810001 name module.module.external_feature_model.vit.decoder.layers.6.ls1 lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.14.ls2 lr_decay_rate 0.3486784401000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.weight key (0.0, 0.03874204890000001, False, False)name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.bias lr_decay_rate 0.3874204890000001 name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.weight lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.weight key (1.0, 0.05904900000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.bias key (0.0, 0.028242953648100012, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.bias key (0.0, 0.013508517176729929, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.weight key (1.0, 0.03486784401000001, False, False) name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.bias lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.bias key (0.0, 0.028242953648100012, False, False)name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.bias lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.ls1 key (0.0, 0.015009463529699918, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.bias key (0.0, 0.03874204890000001, False, False)name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.bias lr_decay_rate 0.5904900000000001 name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.weight lr_decay_rate 0.07976644307687256_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.weight key (1.0, 0.03486784401000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.ls2 key (0.0, 0.03486784401000001, False, False) name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.bias lr_decay_rate 0.3874204890000001 name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.bias lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.weight lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.bias key (0.0, 0.03874204890000001, False, False) name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.weight lr_decay_rate 0.2824295364810001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.bias key (0.0, 0.03486784401000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.weight key (1.0, 0.007976644307687256, False, False)name module.module.external_feature_model.vit.decoder.layers.13.ls1 lr_decay_rate 0.31381059609000006_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.bias key (0.0, 0.03874204890000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.bias key (0.0, 0.05904900000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.bias lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.6.ls2 lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.bias key (0.0, 0.03486784401000001, False, False)name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.weight lr_decay_rate 0.3874204890000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.weight key (1.0, 0.013508517176729929, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.weight key (1.0, 0.028242953648100012, False, False)name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.weight lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.weight lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.bias key (0.0, 0.03486784401000001, False, False)name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.bias lr_decay_rate 0.07976644307687256_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.ls1 key (0.0, 0.031381059609000006, False, False)name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.weight lr_decay_rate 0.3874204890000001name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.weight lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.weight key (1.0, 0.03874204890000001, False, False)name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.weight lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.ls2 key (0.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.weight key (1.0, 0.03874204890000001, False, False) name module.module.external_feature_model.vit.decoder.layers.15.ls1 lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.weight key (0.0, 0.03486784401000001, False, False)name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.bias lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.bias lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.bias key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.13.ls2 lr_decay_rate 0.31381059609000006name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.weight lr_decay_rate 0.3486784401000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.weight key (1.0, 0.03874204890000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.weight key (1.0, 0.05904900000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.weight key (1.0, 0.03486784401000001, False, False) name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.bias lr_decay_rate 0.3874204890000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.bias key (0.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.weight lr_decay_rate 0.15009463529699918name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.bias lr_decay_rate 0.3486784401000001name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.bias lr_decay_rate 0.3874204890000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.ls1 key (0.0, 0.03874204890000001, False, False) name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.bias lr_decay_rate 0.3874204890000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.bias key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.weight key (0.0, 0.03486784401000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.ls2 key (0.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.1.ls1 lr_decay_rate 0.08862938119652507name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.bias lr_decay_rate 0.5904900000000001 name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.bias lr_decay_rate 0.3486784401000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.bias key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.bias key (0.0, 0.03486784401000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.bias key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.bias key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.weight key (0.0, 0.015009463529699918, False, False)name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.weight lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.15.ls2 lr_decay_rate 0.3874204890000001 name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.bias lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.weight lr_decay_rate 0.2824295364810001name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.weight lr_decay_rate 0.31381059609000006_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.bias key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.ls1 key (0.0, 0.008862938119652507, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.bias key (0.0, 0.03486784401000001, False, False) name module.module.external_feature_model.vit.decoder.layers.16.ls1 lr_decay_rate 0.4304672100000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.weight key (0.0, 0.013508517176729929, False, False)name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.bias lr_decay_rate 0.15009463529699918_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.ls2 key (0.0, 0.03874204890000001, False, False)name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.weight lr_decay_rate 0.3874204890000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.bias key (0.0, 0.03486784401000001, False, False) name module.module.external_feature_model.vit.decoder.layers.16.ls1 lr_decay_rate 0.4304672100000001 name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.weight lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.1.ls2 lr_decay_rate 0.08862938119652507_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.weight key (0.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.20.ls1 lr_decay_rate 0.6561_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.weight key (1.0, 0.028242953648100012, False, False) name module.module.external_feature_model.vit.decoder.layers.15.ls1 lr_decay_rate 0.3874204890000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.ls1 key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.bias key (0.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.weight key (1.0, 0.03874204890000001, False, False)name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.bias lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.weight lr_decay_rate 0.3486784401000001name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.weight lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.ls1 key (0.0, 0.04304672100000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.weight key (1.0, 0.03486784401000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.ls2 key (0.0, 0.008862938119652507, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.ls1 key (0.0, 0.06561, False, False) name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.bias lr_decay_rate 0.31381059609000006 name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.bias lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.ls1 key (0.0, 0.03874204890000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.bias key (0.0, 0.013508517176729929, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.weight key (1.0, 0.03486784401000001, False, False)name module.module.external_feature_model.vit.decoder.layers.16.ls2 lr_decay_rate 0.4304672100000001 name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.bias lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.weight key (0.0, 0.03874204890000001, False, False) name module.module.external_feature_model.vit.decoder.layers.16.ls2 lr_decay_rate 0.4304672100000001name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.weight lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.bias key (0.0, 0.031381059609000006, False, False)name module.module.external_feature_model.vit.decoder.layers.20.ls2 lr_decay_rate 0.6561name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.weight lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.bias lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.bias key (0.0, 0.028242953648100012, False, False)name module.module.external_feature_model.vit.decoder.layers.15.ls2 lr_decay_rate 0.3874204890000001 name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.weight lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.ls2 key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.bias key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.ls2 key (0.0, 0.06561, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.bias key (0.0, 0.03486784401000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.weight key (1.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.bias lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.ls2 key (0.0, 0.04304672100000001, False, False)name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.bias lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.ls2 key (0.0, 0.03874204890000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.weight key (0.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.weight lr_decay_rate 0.31381059609000006_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.weight key (1.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.weight lr_decay_rate 0.4304672100000001name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.weight lr_decay_rate 0.2824295364810001name module.module.external_feature_model.vit.decoder.layers.16.ls1 lr_decay_rate 0.4304672100000001name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.bias lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.bias key (0.0, 0.03486784401000001, False, False)name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.weight lr_decay_rate 0.6561 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.bias key (0.0, 0.03874204890000001, False, False)name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.weight lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.weight lr_decay_rate 0.3874204890000001 name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.bias lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.weight lr_decay_rate 0.4304672100000001name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.bias lr_decay_rate 0.08862938119652507_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.weight key (1.0, 0.031381059609000006, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.weight key (0.0, 0.04304672100000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.ls1 key (0.0, 0.04304672100000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.weight key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.bias key (0.0, 0.015009463529699918, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.weight key (0.0, 0.06561, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.weight key (0.0, 0.03874204890000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.bias key (0.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.weight lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.weight key (1.0, 0.03486784401000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.bias key (0.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.weight lr_decay_rate 0.3874204890000001name module.module.external_feature_model.vit.decoder.layers.16.ls2 lr_decay_rate 0.4304672100000001name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.bias lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.weight key (0.0, 0.04304672100000001, False, False) name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.bias lr_decay_rate 0.31381059609000006 name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.bias lr_decay_rate 0.2824295364810001 name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.bias lr_decay_rate 0.6561 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.weight key (1.0, 0.03486784401000001, False, False) name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.weight lr_decay_rate 0.15009463529699918_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.ls2 key (0.0, 0.04304672100000001, False, False)name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.weight lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.bias lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.weight key (1.0, 0.03874204890000001, False, False)name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.bias lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.bias key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.bias key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.bias key (0.0, 0.028242953648100012, False, False)name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.bias lr_decay_rate 0.4304672100000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.bias key (0.0, 0.06561, False, False) name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.bias lr_decay_rate 0.3486784401000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.weight key (1.0, 0.013508517176729929, False, False)name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.weight lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.weight key (1.0, 0.015009463529699918, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.bias key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.bias key (0.0, 0.03486784401000001, False, False) name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.weight lr_decay_rate 0.4304672100000001name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.bias lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.bias key (0.0, 0.04304672100000001, False, False)name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.weight lr_decay_rate 0.31381059609000006 name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.bias lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.weight lr_decay_rate 0.2824295364810001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.bias key (0.0, 0.03486784401000001, False, False) name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.weight lr_decay_rate 0.4304672100000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.weight key (1.0, 0.008862938119652507, False, False)name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.bias lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.weight lr_decay_rate 0.6561_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.weight key (0.0, 0.04304672100000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.bias key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.bias key (0.0, 0.013508517176729929, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.weight key (1.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.weight lr_decay_rate 0.3486784401000001name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.weight lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.weight key (1.0, 0.028242953648100012, False, False)name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.weight lr_decay_rate 0.4304672100000001 name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.bias lr_decay_rate 0.08862938119652507_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.weight key (1.0, 0.04304672100000001, False, False)name module.module.external_feature_model.vit.decoder.layers.15.ls1 lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.weight key (1.0, 0.06561, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.bias key (0.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.bias lr_decay_rate 0.4304672100000001name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.weight lr_decay_rate 0.3874204890000001 name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.bias lr_decay_rate 0.31381059609000006_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.weight key (0.0, 0.03486784401000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.ls1 key (0.0, 0.03874204890000001, False, False)name module.module.external_feature_model.vit.decoder.layers.6.ls1 lr_decay_rate 0.15009463529699918name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.bias lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.weight key (1.0, 0.03874204890000001, False, False)name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.bias lr_decay_rate 0.6561 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.weight key (1.0, 0.04304672100000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.bias key (0.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.bias lr_decay_rate 0.4304672100000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.weight key (1.0, 0.03874204890000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.bias key (0.0, 0.04304672100000001, False, False) name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.weight lr_decay_rate 0.15009463529699918_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.bias key (0.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.bias lr_decay_rate 0.3486784401000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.ls1 key (0.0, 0.015009463529699918, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.bias key (0.0, 0.06561, False, False) name module.module.external_feature_model.vit.decoder.layers.15.ls2 lr_decay_rate 0.3874204890000001 name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.bias lr_decay_rate 0.3874204890000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.bias key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.bias key (0.0, 0.04304672100000001, False, False)name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.bias lr_decay_rate 0.4304672100000001 name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.bias lr_decay_rate 0.3874204890000001name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.weight lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.weight key (0.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.bias key (0.0, 0.03486784401000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.bias key (0.0, 0.03874204890000001, False, False)name module.module.external_feature_model.vit.decoder.layers.6.ls2 lr_decay_rate 0.15009463529699918name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.weight lr_decay_rate 0.6561 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.ls2 key (0.0, 0.03874204890000001, False, False) name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.weight lr_decay_rate 0.31381059609000006name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.weight lr_decay_rate 0.4304672100000001 name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.weight lr_decay_rate 0.2824295364810001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.bias key (0.0, 0.04304672100000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.bias key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.weight key (1.0, 0.008862938119652507, False, False)name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.weight lr_decay_rate 0.4304672100000001 name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.bias lr_decay_rate 0.15009463529699918_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.ls2 key (0.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.weight key (1.0, 0.06561, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.weight key (0.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.weight lr_decay_rate 0.3874204890000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.weight key (1.0, 0.028242953648100012, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.weight key (1.0, 0.04304672100000001, False, False) name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.weight lr_decay_rate 0.3874204890000001name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.weight lr_decay_rate 0.4304672100000001 name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.weight lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.bias lr_decay_rate 0.08862938119652507_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.bias key (0.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.weight lr_decay_rate 0.3874204890000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.weight key (1.0, 0.04304672100000001, False, False) name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.bias lr_decay_rate 0.6561 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.weight key (1.0, 0.03874204890000001, False, False)name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.weight lr_decay_rate 0.15009463529699918name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.bias lr_decay_rate 0.31381059609000006name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.bias lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.weight key (1.0, 0.03486784401000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.weight key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.weight key (1.0, 0.04304672100000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.weight key (0.0, 0.03874204890000001, False, False)name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.bias lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.bias key (0.0, 0.06561, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.bias key (0.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.bias lr_decay_rate 0.4304672100000001name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.weight lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.bias key (0.0, 0.031381059609000006, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.bias key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.weight key (0.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.bias lr_decay_rate 0.3874204890000001 name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.bias lr_decay_rate 0.3486784401000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.bias key (0.0, 0.04304672100000001, False, False) name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.bias lr_decay_rate 0.3874204890000001 name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.bias lr_decay_rate 0.3874204890000001 name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.bias lr_decay_rate 0.4304672100000001 name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.weight lr_decay_rate 0.6561_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.bias key (0.0, 0.04304672100000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.weight key (1.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.weight lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.weight lr_decay_rate 0.31381059609000006_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.bias key (0.0, 0.03874204890000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.bias key (0.0, 0.03486784401000001, False, False)name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.bias lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.13.ls1 lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.bias key (0.0, 0.04304672100000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.weight key (0.0, 0.06561, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.bias key (0.0, 0.03874204890000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.bias key (0.0, 0.03874204890000001, False, False)name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.weight lr_decay_rate 0.4304672100000001name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.bias lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.weight key (0.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.weight lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.weight key (1.0, 0.031381059609000006, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.ls1 key (0.0, 0.031381059609000006, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.bias key (0.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.weight lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.weight lr_decay_rate 0.3874204890000001name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.bias lr_decay_rate 0.6561name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.weight lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.weight key (1.0, 0.04304672100000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.bias key (0.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.bias lr_decay_rate 0.08862938119652507_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.weight key (0.0, 0.04304672100000001, False, False) name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.weight lr_decay_rate 0.3874204890000001name module.module.external_feature_model.vit.decoder.layers.13.ls2 lr_decay_rate 0.31381059609000006 name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.weight lr_decay_rate 0.3874204890000001 name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.bias lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.weight key (1.0, 0.03486784401000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.weight key (0.0, 0.03874204890000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.bias key (0.0, 0.06561, False, False)name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.weight lr_decay_rate 0.15009463529699918name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.bias lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.weight key (0.0, 0.04304672100000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.weight key (1.0, 0.03874204890000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.bias key (0.0, 0.008862938119652507, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.weight key (1.0, 0.03874204890000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.bias key (0.0, 0.031381059609000006, False, False)name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.weight lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.bias key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.ls2 key (0.0, 0.031381059609000006, False, False)name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.bias lr_decay_rate 0.4304672100000001 name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.bias lr_decay_rate 0.3486784401000001name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.weight lr_decay_rate 0.6561name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.bias lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.weight key (1.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.bias lr_decay_rate 0.4304672100000001 name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.bias lr_decay_rate 0.3874204890000001name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.bias lr_decay_rate 0.3874204890000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.weight key (1.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.weight lr_decay_rate 0.08862938119652507name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.weight lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.bias key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.bias key (0.0, 0.03486784401000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.weight key (1.0, 0.06561, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.bias key (0.0, 0.03874204890000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.bias key (0.0, 0.04304672100000001, False, False)name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.weight lr_decay_rate 0.4304672100000001 name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.weight lr_decay_rate 0.31381059609000006name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.bias lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.bias key (0.0, 0.03874204890000001, False, False)name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.bias lr_decay_rate 0.15009463529699918_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.weight key (1.0, 0.031381059609000006, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.bias key (0.0, 0.03874204890000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.weight key (1.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.weight key (0.0, 0.04304672100000001, False, False) name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.bias lr_decay_rate 0.6561name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.weight lr_decay_rate 0.4304672100000001 name module.module.external_feature_model.vit.decoder.layers.15.ls1 lr_decay_rate 0.3874204890000001 name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.weight lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.bias key (0.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.weight lr_decay_rate 0.3874204890000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.weight key (0.0, 0.031381059609000006, False, False)name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.weight lr_decay_rate 0.3874204890000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.bias key (0.0, 0.015009463529699918, False, False)name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.bias lr_decay_rate 0.31381059609000006 name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.bias lr_decay_rate 0.08862938119652507_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.bias key (0.0, 0.06561, False, False)name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.weight lr_decay_rate 0.3874204890000001 name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.bias lr_decay_rate 0.4304672100000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.weight key (1.0, 0.04304672100000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.ls1 key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.weight key (1.0, 0.04304672100000001, False, False) name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.weight lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.weight key (1.0, 0.03874204890000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.weight key (1.0, 0.03874204890000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.bias key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.bias key (0.0, 0.008862938119652507, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.weight key (1.0, 0.03874204890000001, False, False)name module.module.external_feature_model.vit.decoder.layers.7.ls1 lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.bias lr_decay_rate 0.31381059609000006name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.bias lr_decay_rate 0.4304672100000001 name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.weight lr_decay_rate 0.6561 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.bias key (0.0, 0.04304672100000001, False, False) name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.bias lr_decay_rate 0.4304672100000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.weight key (1.0, 0.015009463529699918, False, False)name module.module.external_feature_model.vit.decoder.layers.15.ls2 lr_decay_rate 0.3874204890000001 name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.bias lr_decay_rate 0.3874204890000001name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.bias lr_decay_rate 0.3874204890000001 name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.bias lr_decay_rate 0.3874204890000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.bias key (0.0, 0.031381059609000006, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.bias key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.ls1 key (0.0, 0.016677181699666577, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.weight key (1.0, 0.06561, False, False)name module.module.external_feature_model.vit.decoder.layers.14.ls1 lr_decay_rate 0.3486784401000001name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.weight lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.bias key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.bias key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.ls2 key (0.0, 0.03874204890000001, False, False) name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.bias lr_decay_rate 0.15009463529699918_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.bias key (0.0, 0.03874204890000001, False, False)name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.weight lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.bias key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.weight key (1.0, 0.008862938119652507, False, False)name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.bias lr_decay_rate 0.6561_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.ls1 key (0.0, 0.03486784401000001, False, False) name module.module.external_feature_model.vit.decoder.layers.7.ls2 lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.weight lr_decay_rate 0.4304672100000001 name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.weight lr_decay_rate 0.31381059609000006_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.weight key (1.0, 0.04304672100000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.bias key (0.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.weight lr_decay_rate 0.3874204890000001 name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.weight lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.weight key (1.0, 0.04304672100000001, False, False)name module.module.external_feature_model.vit.decoder.layers.14.ls2 lr_decay_rate 0.3486784401000001name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.weight lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.bias key (0.0, 0.06561, False, False)name module.module.external_feature_model.vit.decoder.layers.16.ls1 lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.ls2 key (0.0, 0.016677181699666577, False, False)name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.bias lr_decay_rate 0.08862938119652507name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.weight lr_decay_rate 0.3874204890000001 name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.bias lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.weight key (1.0, 0.03874204890000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.weight key (1.0, 0.031381059609000006, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.weight key (1.0, 0.04304672100000001, False, False) name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.bias lr_decay_rate 0.4304672100000001name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.weight lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.bias key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.ls2 key (0.0, 0.03486784401000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.bias key (0.0, 0.008862938119652507, False, False)name module.module.external_feature_model.vit.decoder.layers.21.ls1 lr_decay_rate 0.7290000000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.weight key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.ls1 key (0.0, 0.04304672100000001, False, False) name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.bias lr_decay_rate 0.3874204890000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.weight key (0.0, 0.03874204890000001, False, False)name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.weight lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.bias lr_decay_rate 0.31381059609000006 name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.bias lr_decay_rate 0.4304672100000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.bias key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.weight key (0.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.weight lr_decay_rate 0.4304672100000001 name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.weight lr_decay_rate 0.3486784401000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.bias key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.ls1 key (0.0, 0.0729, False, False)name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.bias lr_decay_rate 0.3874204890000001name module.module.external_feature_model.vit.decoder.layers.2.ls1 lr_decay_rate 0.09847709021836118_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.weight key (0.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.16.ls2 lr_decay_rate 0.4304672100000001 name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.bias lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.bias key (0.0, 0.031381059609000006, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.bias key (0.0, 0.04304672100000001, False, False) name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.bias lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.weight key (0.0, 0.03486784401000001, False, False) name module.module.external_feature_model.vit.decoder.layers.17.ls1 lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.weight key (1.0, 0.04304672100000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.ls1 key (0.0, 0.00984770902183612, False, False)name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.bias lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.bias key (0.0, 0.03874204890000001, False, False) name module.module.external_feature_model.vit.decoder.layers.21.ls2 lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.ls2 key (0.0, 0.04304672100000001, False, False) name module.module.external_feature_model.vit.decoder.layers.16.ls1 lr_decay_rate 0.4304672100000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.bias key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.bias key (0.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.17.ls1 lr_decay_rate 0.4782969000000001 name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.weight lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.bias key (0.0, 0.016677181699666577, False, False)name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.bias lr_decay_rate 0.4304672100000001name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.bias lr_decay_rate 0.3486784401000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.ls1 key (0.0, 0.04782969000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.2.ls2 lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.ls2 key (0.0, 0.0729, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.ls1 key (0.0, 0.04304672100000001, False, False)name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.weight lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.weight key (1.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.weight lr_decay_rate 0.3874204890000001name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.weight lr_decay_rate 0.3874204890000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.ls1 key (0.0, 0.04782969000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.weight lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.ls2 key (0.0, 0.00984770902183612, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.bias key (0.0, 0.04304672100000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.bias key (0.0, 0.03486784401000001, False, False) name module.module.external_feature_model.vit.decoder.layers.17.ls2 lr_decay_rate 0.4782969000000001name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.weight lr_decay_rate 0.7290000000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.weight key (0.0, 0.04304672100000001, False, False) name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.bias lr_decay_rate 0.31381059609000006 name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.weight lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.16.ls2 lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.weight key (1.0, 0.03874204890000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.weight key (1.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.weight lr_decay_rate 0.09847709021836118_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.weight key (1.0, 0.03874204890000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.ls2 key (0.0, 0.04782969000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.weight key (0.0, 0.0729, False, False) name module.module.external_feature_model.vit.decoder.layers.17.ls2 lr_decay_rate 0.4782969000000001name module.module.external_feature_model.vit.decoder.layers.17.ls1 lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.bias key (0.0, 0.031381059609000006, False, False)name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.bias lr_decay_rate 0.4304672100000001 name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.weight lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.ls2 key (0.0, 0.04304672100000001, False, False) name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.bias lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.weight key (1.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.bias lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.weight key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.bias lr_decay_rate 0.3874204890000001name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.bias lr_decay_rate 0.7290000000000001 name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.weight lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.ls1 key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.bias key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.ls2 key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.bias key (0.0, 0.015009463529699918, False, False)name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.weight lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.weight key (1.0, 0.03486784401000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.weight key (0.0, 0.04782969000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.weight lr_decay_rate 0.31381059609000006_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.bias key (0.0, 0.03874204890000001, False, False)name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.bias lr_decay_rate 0.16677181699666577_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.bias key (0.0, 0.0729, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.bias key (0.0, 0.03874204890000001, False, False)name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.bias lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.17.ls2 lr_decay_rate 0.4782969000000001 name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.weight lr_decay_rate 0.4782969000000001name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.weight lr_decay_rate 0.15009463529699918name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.weight lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.weight key (0.0, 0.04304672100000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.bias key (0.0, 0.016677181699666577, False, False)name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.bias lr_decay_rate 0.3486784401000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.bias key (0.0, 0.00984770902183612, False, False)name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.bias lr_decay_rate 0.4782969000000001name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.weight lr_decay_rate 0.3874204890000001 name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.weight lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.weight key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.ls2 key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.weight key (0.0, 0.04782969000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.bias lr_decay_rate 0.4304672100000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.weight key (1.0, 0.04304672100000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.weight key (1.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.bias key (0.0, 0.03486784401000001, False, False) name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.weight lr_decay_rate 0.7290000000000001 name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.weight lr_decay_rate 0.16677181699666577_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.bias key (0.0, 0.04782969000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.weight key (1.0, 0.03874204890000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.weight key (1.0, 0.03874204890000001, False, False) name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.bias lr_decay_rate 0.31381059609000006name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.weight lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.bias lr_decay_rate 0.4304672100000001name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.bias lr_decay_rate 0.4782969000000001name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.bias lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.bias key (0.0, 0.04304672100000001, False, False)name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.weight lr_decay_rate 0.4782969000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.weight key (1.0, 0.0729, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.weight key (1.0, 0.016677181699666577, False, False)name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.weight lr_decay_rate 0.3486784401000001name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.bias lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.bias key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.weight key (1.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.bias lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.bias key (0.0, 0.015009463529699918, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.bias key (0.0, 0.04304672100000001, False, False)name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.weight lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.bias key (0.0, 0.04782969000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.weight key (1.0, 0.03486784401000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.weight key (0.0, 0.04782969000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.bias key (0.0, 0.03874204890000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.bias key (0.0, 0.03874204890000001, False, False)name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.bias lr_decay_rate 0.7290000000000001name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.bias lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.weight lr_decay_rate 0.4304672100000001 name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.weight lr_decay_rate 0.31381059609000006name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.bias lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.bias lr_decay_rate 0.3486784401000001name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.weight lr_decay_rate 0.4304672100000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.weight key (1.0, 0.04782969000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.bias key (0.0, 0.0729, False, False)name module.module.external_feature_model.vit.decoder.layers.7.ls1 lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.bias lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.weight key (1.0, 0.04304672100000001, False, False)name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.weight lr_decay_rate 0.4782969000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.bias key (0.0, 0.00984770902183612, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.bias key (0.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.16.ls1 lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.weight key (1.0, 0.031381059609000006, False, False)name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.weight lr_decay_rate 0.3874204890000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.weight key (1.0, 0.04304672100000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.bias key (0.0, 0.03486784401000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.bias key (0.0, 0.04782969000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.bias lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.ls1 key (0.0, 0.016677181699666577, False, False)name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.bias lr_decay_rate 0.4304672100000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.ls1 key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.weight key (1.0, 0.04782969000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.weight lr_decay_rate 0.7290000000000001 name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.weight lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.weight lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.weight key (0.0, 0.03874204890000001, False, False)name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.bias lr_decay_rate 0.31381059609000006name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.bias lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.bias key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.bias key (0.0, 0.04304672100000001, False, False)name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.weight lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.weight lr_decay_rate 0.4782969000000001name module.module.external_feature_model.vit.decoder.layers.7.ls2 lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.bias lr_decay_rate 0.4782969000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.weight key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.weight key (1.0, 0.0729, False, False)name module.module.external_feature_model.vit.decoder.layers.16.ls2 lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.weight key (1.0, 0.00984770902183612, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.bias key (0.0, 0.031381059609000006, False, False)name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.bias lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.bias key (0.0, 0.04304672100000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.weight key (1.0, 0.04782969000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.weight key (0.0, 0.03486784401000001, False, False)name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.weight lr_decay_rate 0.4782969000000001 name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.weight lr_decay_rate 0.4304672100000001name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.bias lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.ls2 key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.bias key (0.0, 0.04782969000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.bias lr_decay_rate 0.7290000000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.ls2 key (0.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.bias lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.bias key (0.0, 0.03874204890000001, False, False) name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.weight lr_decay_rate 0.31381059609000006_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.weight key (1.0, 0.04782969000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.bias lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.bias key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.bias key (0.0, 0.0729, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.weight key (1.0, 0.04304672100000001, False, False) name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.weight lr_decay_rate 0.4304672100000001 name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.bias lr_decay_rate 0.4782969000000001 name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.weight lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.bias key (0.0, 0.00984770902183612, False, False)name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.weight lr_decay_rate 0.4304672100000001 name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.weight lr_decay_rate 0.16677181699666577_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.weight key (1.0, 0.031381059609000006, False, False)name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.bias lr_decay_rate 0.4782969000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.bias key (0.0, 0.03486784401000001, False, False) name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.weight lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.weight key (0.0, 0.04304672100000001, False, False)name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.bias lr_decay_rate 0.4304672100000001 name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.weight lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.bias key (0.0, 0.04782969000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.weight key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.weight key (1.0, 0.04782969000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.bias key (0.0, 0.04782969000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.weight key (0.0, 0.016677181699666577, False, False)name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.weight lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.weight lr_decay_rate 0.7290000000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.weight key (1.0, 0.03874204890000001, False, False)name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.bias lr_decay_rate 0.31381059609000006name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.weight lr_decay_rate 0.3486784401000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.bias key (0.0, 0.04304672100000001, False, False)name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.bias lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.weight key (1.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.bias lr_decay_rate 0.4782969000000001 name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.weight lr_decay_rate 0.4782969000000001name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.bias lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.weight key (0.0, 0.00984770902183612, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.bias key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.bias key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.weight key (0.0, 0.0729, False, False)name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.bias lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.bias lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.weight key (1.0, 0.03486784401000001, False, False)name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.weight lr_decay_rate 0.4782969000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.weight key (1.0, 0.04782969000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.bias key (0.0, 0.04304672100000001, False, False) name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.bias lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.bias key (0.0, 0.04782969000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.weight lr_decay_rate 0.4304672100000001 name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.bias lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.weight key (0.0, 0.04782969000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.14.ls1 lr_decay_rate 0.3486784401000001name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.bias lr_decay_rate 0.4782969000000001 name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.bias lr_decay_rate 0.7290000000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.bias key (0.0, 0.016677181699666577, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.bias key (0.0, 0.016677181699666577, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.bias key (0.0, 0.03874204890000001, False, False) name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.weight lr_decay_rate 0.4304672100000001 name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.bias lr_decay_rate 0.3486784401000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.bias key (0.0, 0.00984770902183612, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.weight key (0.0, 0.04304672100000001, False, False) name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.bias lr_decay_rate 0.4782969000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.ls1 key (0.0, 0.03486784401000001, False, False)name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.weight lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.bias key (0.0, 0.04782969000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.bias key (0.0, 0.0729, False, False) name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.weight lr_decay_rate 0.4782969000000001name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.weight lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.bias key (0.0, 0.03486784401000001, False, False) name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.weight lr_decay_rate 0.16677181699666577_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.weight key (1.0, 0.04304672100000001, False, False) name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.weight lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.weight lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.bias lr_decay_rate 0.4304672100000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.bias key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.weight key (0.0, 0.04782969000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.14.ls2 lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.weight key (1.0, 0.04304672100000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.weight key (1.0, 0.016677181699666577, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.weight key (1.0, 0.03874204890000001, False, False) name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.weight lr_decay_rate 0.3486784401000001name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.weight lr_decay_rate 0.7290000000000001name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.bias lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.bias key (0.0, 0.04304672100000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.weight key (1.0, 0.00984770902183612, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.weight key (1.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.bias lr_decay_rate 0.4782969000000001 name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.weight lr_decay_rate 0.4782969000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.ls2 key (0.0, 0.03486784401000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.weight key (1.0, 0.03486784401000001, False, False)name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.weight lr_decay_rate 0.4782969000000001name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.bias lr_decay_rate 0.4304672100000001 name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.bias lr_decay_rate 0.3874204890000001 name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.bias lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.bias key (0.0, 0.04304672100000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.weight key (1.0, 0.0729, False, False)name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.weight lr_decay_rate 0.4304672100000001name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.bias lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.bias key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.weight key (0.0, 0.04782969000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.bias lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.bias key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.weight key (1.0, 0.04782969000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.bias lr_decay_rate 0.3486784401000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.bias key (0.0, 0.04304672100000001, False, False)name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.weight lr_decay_rate 0.3486784401000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.weight key (1.0, 0.04304672100000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.bias key (0.0, 0.03874204890000001, False, False) name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.weight lr_decay_rate 0.4304672100000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.bias key (0.0, 0.00984770902183612, False, False)name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.bias lr_decay_rate 0.7290000000000001 name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.bias lr_decay_rate 0.4782969000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.bias key (0.0, 0.016677181699666577, False, False)name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.weight lr_decay_rate 0.4782969000000001name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.bias lr_decay_rate 0.4782969000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.bias key (0.0, 0.03486784401000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.weight key (0.0, 0.03486784401000001, False, False) name module.module.external_feature_model.vit.decoder.layers.8.ls1 lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.weight key (1.0, 0.04304672100000001, False, False) name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.bias lr_decay_rate 0.4304672100000001 name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.weight lr_decay_rate 0.4304672100000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.bias key (0.0, 0.0729, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.bias key (0.0, 0.04782969000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.16.ls1 lr_decay_rate 0.4304672100000001name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.weight lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.weight key (1.0, 0.04782969000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.bias key (0.0, 0.04782969000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.bias lr_decay_rate 0.4304672100000001name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.bias lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.15.ls1 lr_decay_rate 0.3874204890000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.bias key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.ls1 key (0.0, 0.018530201888518418, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.weight key (1.0, 0.04304672100000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.ls1 key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.weight key (1.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.weight lr_decay_rate 0.7290000000000001 name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.weight lr_decay_rate 0.4782969000000001name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.weight lr_decay_rate 0.4782969000000001name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.bias lr_decay_rate 0.4782969000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.bias key (0.0, 0.04304672100000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.bias key (0.0, 0.03486784401000001, False, False) name module.module.external_feature_model.vit.decoder.layers.8.ls2 lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.ls1 key (0.0, 0.03874204890000001, False, False) name module.module.external_feature_model.vit.decoder.layers.16.ls2 lr_decay_rate 0.4304672100000001name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.weight lr_decay_rate 0.4304672100000001name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.bias lr_decay_rate 0.4304672100000001 name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.bias lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.weight key (1.0, 0.0729, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.weight key (1.0, 0.04782969000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.weight key (1.0, 0.04782969000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.bias key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.ls2 key (0.0, 0.018530201888518418, False, False)name module.module.external_feature_model.vit.decoder.layers.17.ls1 lr_decay_rate 0.4782969000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.bias key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.ls2 key (0.0, 0.04304672100000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.weight key (1.0, 0.04304672100000001, False, False)name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.bias lr_decay_rate 0.4782969000000001name module.module.external_feature_model.vit.decoder.layers.15.ls2 lr_decay_rate 0.3874204890000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.bias key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.bias lr_decay_rate 0.7290000000000001name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.weight lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.class_token lr_decay_rate 1.0 name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.bias lr_decay_rate 0.4782969000000001 name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.weight lr_decay_rate 0.4782969000000001name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.weight lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.ls1 key (0.0, 0.04782969000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.weight lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.bias key (0.0, 0.04782969000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.ls2 key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.bias key (0.0, 0.0729, False, False)name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.weight lr_decay_rate 0.4304672100000001 name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.bias lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.weight key (1.0, 0.03486784401000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.weight key (1.0, 0.04782969000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.bias key (0.0, 0.04782969000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.3.ls1 lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.weight key (0.0, 0.04304672100000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.weight key (0.0, 0.018530201888518418, False, False)name module.module.external_feature_model.vit.decoder.layers.17.ls2 lr_decay_rate 0.4782969000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.weight key (0.0, 0.04304672100000001, False, False)name module.module.external_feature_model.vit.decoder.layers.22.ls1 lr_decay_rate 0.81_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.bias key (0.0, 0.04304672100000001, False, False) name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.weight lr_decay_rate 0.4782969000000001 name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.weight lr_decay_rate 0.3874204890000001 name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.bias lr_decay_rate 0.4782969000000001name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.bias lr_decay_rate 0.3486784401000001name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.bias lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.ls1 key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.18.ls1 lr_decay_rate 0.531441 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.ls2 key (0.0, 0.04782969000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.bias lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.weight key (1.0, 0.04782969000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.weight key (0.0, 0.03874204890000001, False, False)name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.bias lr_decay_rate 0.4304672100000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.bias key (0.0, 0.04782969000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.ls1 key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.bias key (0.0, 0.03486784401000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.bias key (0.0, 0.04304672100000001, False, False) name module.module.external_feature_model.vit.decoder.layers.17.ls1 lr_decay_rate 0.4782969000000001 name module.module.external_feature_model.vit.decoder.layers.3.ls2 lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.ls1 key (0.0, 0.05314410000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.bias key (0.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.weight lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.bias key (0.0, 0.04304672100000001, False, False) name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.bias lr_decay_rate 0.4782969000000001name module.module.external_feature_model.vit.decoder.layers.22.ls2 lr_decay_rate 0.81 name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.bias lr_decay_rate 0.3874204890000001 name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.weight lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.weight lr_decay_rate 0.3486784401000001name module.module.external_feature_model.vit.decoder.layers.18.ls1 lr_decay_rate 0.531441_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.ls2 key (0.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.ls1 key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.weight key (0.0, 0.04782969000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.18.ls2 lr_decay_rate 0.531441name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.weight lr_decay_rate 0.18530201888518416_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.bias key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.ls2 key (0.0, 0.08100000000000002, False, False)name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.weight lr_decay_rate 0.4304672100000001name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.weight lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.bias key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.weight key (1.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.weight key (1.0, 0.03486784401000001, False, False) name module.module.external_feature_model.vit.decoder.layers.17.ls2 lr_decay_rate 0.4782969000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.ls1 key (0.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.weight lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.ls2 key (0.0, 0.05314410000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.bias lr_decay_rate 0.4782969000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.weight key (1.0, 0.018530201888518418, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.weight key (1.0, 0.04304672100000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.weight key (1.0, 0.04304672100000001, False, False) name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.weight lr_decay_rate 0.81name module.module.external_feature_model.vit.decoder.layers.18.ls1 lr_decay_rate 0.531441name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.bias lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.bias lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.weight key (0.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.ls2 key (0.0, 0.04782969000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.weight lr_decay_rate 0.3874204890000001name module.module.external_feature_model.vit.decoder.layers.18.ls2 lr_decay_rate 0.531441name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.bias lr_decay_rate 0.4304672100000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.bias key (0.0, 0.04782969000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.weight lr_decay_rate 0.531441name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.bias lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.weight key (0.0, 0.08100000000000002, False, False) name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.bias lr_decay_rate 0.4304672100000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.bias key (0.0, 0.03486784401000001, False, False)name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.bias lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.ls1 key (0.0, 0.05314410000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.bias key (0.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.weight lr_decay_rate 0.4782969000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.bias key (0.0, 0.04304672100000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.ls2 key (0.0, 0.05314410000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.weight key (1.0, 0.03874204890000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.bias key (0.0, 0.018530201888518418, False, False) _get_param_groups name module.module.external_feature_model.vit.class_token key (1.0, 0.1, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.weight key (0.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.weight lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.bias key (0.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.bias key (0.0, 0.04304672100000001, False, False)name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.bias lr_decay_rate 0.81 name module.module.external_feature_model.vit.decoder.layers.18.ls2 lr_decay_rate 0.531441 name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.weight lr_decay_rate 0.3486784401000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.weight key (0.0, 0.04782969000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.weight lr_decay_rate 0.4304672100000001 name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.weight lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.bias lr_decay_rate 0.3874204890000001name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.weight lr_decay_rate 0.531441_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.bias key (0.0, 0.08100000000000002, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.weight key (1.0, 0.04782969000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.weight lr_decay_rate 0.18530201888518416name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.bias lr_decay_rate 0.531441 name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.weight lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.ls2 key (0.0, 0.05314410000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.weight key (0.0, 0.03486784401000001, False, False) name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.weight lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.weight key (1.0, 0.04304672100000001, False, False) name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.bias lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.weight key (0.0, 0.05314410000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.weight key (0.0, 0.016677181699666577, False, False)name module.module.external_feature_model.vit.conv1.weight lr_decay_rate 0.0717897987691853_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.weight key (1.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.bias key (0.0, 0.03874204890000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.weight key (1.0, 0.04304672100000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.bias key (0.0, 0.05314410000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.bias lr_decay_rate 0.4782969000000001name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.weight lr_decay_rate 0.81 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.bias key (0.0, 0.04782969000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.weight key (1.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.bias lr_decay_rate 0.4304672100000001 name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.bias lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.weight lr_decay_rate 0.531441 name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.bias lr_decay_rate 0.531441 name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.bias lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.bias lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.bias lr_decay_rate 0.4304672100000001_get_param_groups name module.module.external_feature_model.vit.conv1.weight key (1.0, 0.00717897987691853, False, False)name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.weight lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.bias key (0.0, 0.04782969000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.bias key (0.0, 0.03486784401000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.bias key (0.0, 0.04304672100000001, False, False) name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.bias lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.weight key (1.0, 0.08100000000000002, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.weight key (0.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.weight lr_decay_rate 0.531441_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.bias key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.bias key (0.0, 0.05314410000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.bias key (0.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.weight lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.weight key (1.0, 0.03874204890000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.bias key (0.0, 0.04304672100000001, False, False) name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.weight lr_decay_rate 0.4782969000000001name module.module.external_feature_model.vit.conv1.bias lr_decay_rate 0.0717897987691853 name module.module.external_feature_model.vit.decoder.layers.17.ls1 lr_decay_rate 0.4782969000000001 name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.weight lr_decay_rate 0.3486784401000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.bias key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.bias lr_decay_rate 0.81name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.bias lr_decay_rate 0.531441_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.weight key (1.0, 0.05314410000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.weight lr_decay_rate 0.531441_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.weight key (1.0, 0.04782969000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.weight lr_decay_rate 0.18530201888518416_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.weight key (1.0, 0.04782969000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.bias lr_decay_rate 0.3874204890000001name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.weight lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.conv1.bias key (0.0, 0.00717897987691853, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.ls1 key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.weight key (1.0, 0.03486784401000001, False, False)name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.weight lr_decay_rate 0.4304672100000001 name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.weight lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.bias key (0.0, 0.05314410000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.bias key (0.0, 0.08100000000000002, False, False) name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.bias lr_decay_rate 0.531441 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.weight key (0.0, 0.018530201888518418, False, False)name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.bias lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.bias key (0.0, 0.03874204890000001, False, False)name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.bias lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.weight key (1.0, 0.05314410000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.weight key (1.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.17.ls2 lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.weight key (1.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.bias lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.weight lr_decay_rate 0.81_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.weight key (0.0, 0.04304672100000001, False, False)name module.module.external_feature_model.vit.position_embeddings.weight lr_decay_rate 0.0717897987691853 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.bias key (0.0, 0.04782969000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.weight lr_decay_rate 0.531441 name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.bias lr_decay_rate 0.18530201888518416_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.bias key (0.0, 0.04782969000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.bias key (0.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.weight lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.bias key (0.0, 0.03486784401000001, False, False) name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.bias lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.bias lr_decay_rate 0.531441name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.bias lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.weight key (1.0, 0.05314410000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.ls2 key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.position_embeddings.weight key (1.0, 0.00717897987691853, False, False)name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.weight lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.weight key (1.0, 0.08100000000000002, False, False)name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.bias lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.bias key (0.0, 0.05314410000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.bias key (0.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.bias lr_decay_rate 0.531441 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.weight key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.bias key (0.0, 0.016677181699666577, False, False)name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.weight lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.bias key (0.0, 0.010941898913151242, False, False)name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.weight lr_decay_rate 0.531441 name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.weight lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.weight lr_decay_rate 0.4782969000000001 name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.weight lr_decay_rate 0.531441 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.bias key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.weight key (1.0, 0.04782969000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.bias key (0.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.bias lr_decay_rate 0.81 name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.weight lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.weight key (0.0, 0.04782969000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.bias lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.weight key (1.0, 0.05314410000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.weight key (0.0, 0.04782969000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.weight key (1.0, 0.05314410000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.weight key (1.0, 0.03486784401000001, False, False)name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.weight lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.decoder.layers.0.ls1 lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.weight lr_decay_rate 0.10941898913151242 name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.weight lr_decay_rate 0.4304672100000001name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.weight lr_decay_rate 0.531441 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.bias key (0.0, 0.08100000000000002, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.weight key (1.0, 0.018530201888518418, False, False)name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.bias lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.bias key (0.0, 0.03874204890000001, False, False) name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.bias lr_decay_rate 0.4782969000000001name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.bias lr_decay_rate 0.531441name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.bias lr_decay_rate 0.531441 name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.bias lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.weight key (1.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.bias lr_decay_rate 0.3486784401000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.weight key (1.0, 0.04304672100000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.bias key (0.0, 0.04782969000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.weight key (1.0, 0.05314410000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.ls1 key (0.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.weight key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.bias lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.bias key (0.0, 0.04782969000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.bias key (0.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.weight lr_decay_rate 0.81 name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.weight lr_decay_rate 0.3874204890000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.bias key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.bias key (0.0, 0.05314410000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.bias key (0.0, 0.03486784401000001, False, False) name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.bias lr_decay_rate 0.531441name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.bias lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.bias lr_decay_rate 0.10941898913151242 name module.module.external_feature_model.vit.decoder.layers.0.ls2 lr_decay_rate 0.07976644307687256name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.bias lr_decay_rate 0.4304672100000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.bias key (0.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.weight lr_decay_rate 0.4782969000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.weight key (0.0, 0.08100000000000002, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.weight key (1.0, 0.03874204890000001, False, False)name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.weight lr_decay_rate 0.531441 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.bias key (0.0, 0.05314410000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.weight lr_decay_rate 0.4782969000000001name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.weight lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.ls2 key (0.0, 0.007976644307687256, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.bias key (0.0, 0.016677181699666577, False, False)name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.weight lr_decay_rate 0.531441_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.bias key (0.0, 0.010941898913151242, False, False)name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.weight lr_decay_rate 0.18530201888518416_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.bias key (0.0, 0.04304672100000001, False, False) name module.module.external_feature_model.vit.decoder.layers.15.ls1 lr_decay_rate 0.3874204890000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.weight key (0.0, 0.05314410000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.weight key (1.0, 0.04782969000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.bias lr_decay_rate 0.81name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.bias lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.weight key (0.0, 0.04782969000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.weight key (1.0, 0.04782969000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.weight lr_decay_rate 0.531441 name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.weight lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.weight key (0.0, 0.05314410000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.weight key (1.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.decoder.layers.8.ls1 lr_decay_rate 0.18530201888518416name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.weight lr_decay_rate 0.07976644307687256name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.weight lr_decay_rate 0.10941898913151242name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.bias lr_decay_rate 0.4782969000000001name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.bias lr_decay_rate 0.531441_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.ls1 key (0.0, 0.03874204890000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.weight key (0.0, 0.05314410000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.bias key (0.0, 0.08100000000000002, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.bias key (0.0, 0.03874204890000001, False, False) name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.bias lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.weight key (1.0, 0.04304672100000001, False, False)name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.bias lr_decay_rate 0.4782969000000001name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.bias lr_decay_rate 0.4782969000000001 name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.bias lr_decay_rate 0.531441 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.weight key (0.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.ls1 key (0.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.weight key (1.0, 0.010941898913151242, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.bias key (0.0, 0.04782969000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.bias key (0.0, 0.05314410000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.bias lr_decay_rate 0.531441 name module.module.external_feature_model.vit.decoder.layers.15.ls2 lr_decay_rate 0.3874204890000001name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.weight lr_decay_rate 0.81_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.bias key (0.0, 0.05314410000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.bias key (0.0, 0.018530201888518418, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.bias key (0.0, 0.04782969000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.weight lr_decay_rate 0.3874204890000001name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.bias lr_decay_rate 0.4304672100000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.bias key (0.0, 0.04782969000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.bias lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.bias lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.bias key (0.0, 0.05314410000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.8.ls2 lr_decay_rate 0.18530201888518416name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.weight lr_decay_rate 0.4782969000000001 name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.weight lr_decay_rate 0.531441_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.bias key (0.0, 0.04304672100000001, False, False)name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.weight lr_decay_rate 0.531441 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.ls2 key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.weight key (1.0, 0.08100000000000002, False, False) name module.module.external_feature_model.vit.decoder.layers.9.ls1 lr_decay_rate 0.20589113209464907_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.weight key (1.0, 0.03874204890000001, False, False)name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.weight lr_decay_rate 0.4782969000000001 name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.weight lr_decay_rate 0.4782969000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.ls2 key (0.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.bias key (0.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.bias key (0.0, 0.007976644307687256, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.weight key (1.0, 0.04782969000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.weight key (1.0, 0.05314410000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.weight key (1.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.weight lr_decay_rate 0.3874204890000001name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.bias lr_decay_rate 0.81name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.weight lr_decay_rate 0.531441 name module.module.external_feature_model.vit.decoder.layers.17.ls1 lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.ls1 key (0.0, 0.02058911320946491, False, False)name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.bias lr_decay_rate 0.3874204890000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.weight key (1.0, 0.04782969000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.weight key (1.0, 0.04782969000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.bias lr_decay_rate 0.4782969000000001name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.weight lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.weight lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.bias key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.weight key (1.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.weight lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.bias lr_decay_rate 0.531441_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.weight key (0.0, 0.03874204890000001, False, False)name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.bias lr_decay_rate 0.531441 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.ls1 key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.bias key (0.0, 0.03874204890000001, False, False) name module.module.external_feature_model.vit.decoder.layers.9.ls2 lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.bias lr_decay_rate 0.4782969000000001 name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.bias lr_decay_rate 0.4782969000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.bias key (0.0, 0.04782969000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.weight key (0.0, 0.018530201888518418, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.weight key (1.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.bias lr_decay_rate 0.531441name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.bias lr_decay_rate 0.3874204890000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.bias key (0.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.weight lr_decay_rate 0.81_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.weight key (1.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.bias key (0.0, 0.05314410000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.17.ls2 lr_decay_rate 0.4782969000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.bias key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.ls2 key (0.0, 0.02058911320946491, False, False)name module.module.external_feature_model.vit.decoder.layers.16.ls1 lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.bias key (0.0, 0.04782969000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.18.ls1 lr_decay_rate 0.531441 name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.bias lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.bias key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.weight key (1.0, 0.08100000000000002, False, False)name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.bias lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.bias key (0.0, 0.05314410000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.weight lr_decay_rate 0.531441 name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.weight lr_decay_rate 0.531441 name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.bias lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.ls2 key (0.0, 0.04782969000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.weight lr_decay_rate 0.20589113209464907_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.ls1 key (0.0, 0.04304672100000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.bias key (0.0, 0.010941898913151242, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.ls1 key (0.0, 0.05314410000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.weight lr_decay_rate 0.4782969000000001 name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.weight lr_decay_rate 0.4782969000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.bias key (0.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.bias lr_decay_rate 0.81 name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.weight lr_decay_rate 0.531441 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.weight key (1.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.weight lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.weight key (1.0, 0.05314410000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.bias key (0.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.weight key (1.0, 0.04782969000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.weight key (0.0, 0.02058911320946491, False, False)name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.weight lr_decay_rate 0.4782969000000001 name module.module.external_feature_model.vit.decoder.layers.16.ls2 lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.weight key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.weight key (1.0, 0.05314410000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.18.ls2 lr_decay_rate 0.531441_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.bias key (0.0, 0.08100000000000002, False, False) name module.module.external_feature_model.vit.decoder.layers.4.ls1 lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.bias lr_decay_rate 0.531441 name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.bias lr_decay_rate 0.531441name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.weight lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.weight key (1.0, 0.03874204890000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.weight key (0.0, 0.04782969000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.weight lr_decay_rate 0.07976644307687256name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.bias lr_decay_rate 0.4782969000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.ls2 key (0.0, 0.04304672100000001, False, False)name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.bias lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.bias lr_decay_rate 0.4782969000000001name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.bias lr_decay_rate 0.531441 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.weight key (1.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.ls2 key (0.0, 0.05314410000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.ls1 key (0.0, 0.012157665459056936, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.bias key (0.0, 0.05314410000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.23.ls1 lr_decay_rate 0.9_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.bias key (0.0, 0.05314410000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.bias key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.bias key (0.0, 0.04782969000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.bias key (0.0, 0.02058911320946491, False, False)name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.bias lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.bias key (0.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.bias lr_decay_rate 0.3874204890000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.weight key (1.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.4.ls2 lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.weight lr_decay_rate 0.4304672100000001 name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.bias lr_decay_rate 0.18530201888518416name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.weight lr_decay_rate 0.531441 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.ls1 key (0.0, 0.09000000000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.19.ls1 lr_decay_rate 0.5904900000000001 name module.module.external_feature_model.vit.decoder.layers.19.ls1 lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.bias key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.bias key (0.0, 0.04782969000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.bias lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.weight lr_decay_rate 0.4782969000000001 name module.module.external_feature_model.vit.decoder.layers.18.ls1 lr_decay_rate 0.531441_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.weight key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.bias key (0.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.ls2 key (0.0, 0.012157665459056936, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.weight key (0.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.weight lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.19.ls1 lr_decay_rate 0.5904900000000001name module.module.external_feature_model.vit.class_token lr_decay_rate 1.0 name module.module.external_feature_model.vit.decoder.layers.23.ls2 lr_decay_rate 0.9 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.ls1 key (0.0, 0.05904900000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.ls1 key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.bias key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.weight lr_decay_rate 0.4782969000000001name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.weight lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.weight key (1.0, 0.04782969000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.bias lr_decay_rate 0.531441name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.weight lr_decay_rate 0.18530201888518416name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.bias lr_decay_rate 0.4304672100000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.ls1 key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.ls1 key (0.0, 0.05314410000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.weight lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.weight key (1.0, 0.02058911320946491, False, False) name module.module.external_feature_model.vit.decoder.layers.19.ls2 lr_decay_rate 0.5904900000000001name module.module.external_feature_model.vit.decoder.layers.19.ls2 lr_decay_rate 0.5904900000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.ls2 key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.bias key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.weight key (1.0, 0.04782969000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.weight key (1.0, 0.03874204890000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.weight key (1.0, 0.018530201888518418, False, False)name module.module.external_feature_model.vit.decoder.layers.18.ls2 lr_decay_rate 0.531441name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.bias lr_decay_rate 0.4782969000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.bias key (0.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.weight lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.19.ls2 lr_decay_rate 0.5904900000000001name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.bias lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.ls2 key (0.0, 0.05904900000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.bias lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.weight key (0.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.weight lr_decay_rate 0.4304672100000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.ls2 key (0.0, 0.05904900000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.weight lr_decay_rate 0.9 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.ls2 key (0.0, 0.05314410000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.bias key (0.0, 0.04782969000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.bias lr_decay_rate 0.3874204890000001name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.bias lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.bias lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.weight key (0.0, 0.007976644307687256, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.weight key (1.0, 0.04304672100000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.ls2 key (0.0, 0.05904900000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.bias key (0.0, 0.02058911320946491, False, False)name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.weight lr_decay_rate 0.531441name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.weight lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.bias key (0.0, 0.04782969000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.weight key (0.0, 0.09000000000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.weight lr_decay_rate 0.531441 name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.weight lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.bias key (0.0, 0.03874204890000001, False, False)name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.weight lr_decay_rate 0.4782969000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.bias key (0.0, 0.018530201888518418, False, False)name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.bias lr_decay_rate 0.4304672100000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.bias key (0.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.bias lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.bias lr_decay_rate 0.9_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.weight key (1.0, 0.05314410000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.weight key (0.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.weight lr_decay_rate 0.5904900000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.weight key (0.0, 0.05904900000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.weight key (0.0, 0.05904900000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.weight lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.weight lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.bias key (0.0, 0.04304672100000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.weight key (1.0, 0.04782969000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.weight lr_decay_rate 0.3874204890000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.bias key (0.0, 0.09000000000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.weight lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.bias key (0.0, 0.007976644307687256, False, False)name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.weight lr_decay_rate 0.18530201888518416name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.bias lr_decay_rate 0.531441 name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.bias lr_decay_rate 0.5904900000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.weight key (0.0, 0.05904900000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.bias lr_decay_rate 0.531441 name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.bias lr_decay_rate 0.5904900000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.weight key (1.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.weight key (1.0, 0.04782969000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.bias lr_decay_rate 0.4782969000000001name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.weight lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.weight key (0.0, 0.03874204890000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.weight key (1.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.bias lr_decay_rate 0.5904900000000001 name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.weight lr_decay_rate 0.9_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.bias key (0.0, 0.05904900000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.bias key (0.0, 0.05314410000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.class_token key (1.0, 0.1, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.weight key (0.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.bias key (0.0, 0.05904900000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.weight lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.bias key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.bias key (0.0, 0.05314410000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.weight key (1.0, 0.04304672100000001, False, False) name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.bias lr_decay_rate 0.4782969000000001 name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.bias lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.bias key (0.0, 0.05904900000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.bias lr_decay_rate 0.3874204890000001 name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.bias lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.weight key (1.0, 0.09000000000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.weight key (1.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.weight lr_decay_rate 0.531441name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.bias lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.weight lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.bias key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.bias key (0.0, 0.04782969000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.bias lr_decay_rate 0.4304672100000001name module.module.external_feature_model.vit.decoder.layers.18.ls1 lr_decay_rate 0.531441 name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.weight lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.bias key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.bias key (0.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.bias key (0.0, 0.018530201888518418, False, False)name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.weight lr_decay_rate 0.531441name module.module.external_feature_model.vit.conv1.weight lr_decay_rate 0.0717897987691853 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.weight key (1.0, 0.05314410000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.weight key (1.0, 0.05904900000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.bias key (0.0, 0.04304672100000001, False, False) name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.bias lr_decay_rate 0.9name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.bias lr_decay_rate 0.07976644307687256 name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.weight lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.weight key (1.0, 0.05904900000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.weight lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.ls1 key (0.0, 0.05314410000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.bias lr_decay_rate 0.531441name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.weight lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.weight lr_decay_rate 0.4782969000000001 name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.weight lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.weight key (1.0, 0.05314410000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.bias key (0.0, 0.09000000000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.bias key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.bias lr_decay_rate 0.5904900000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.weight key (1.0, 0.05904900000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.weight lr_decay_rate 0.20589113209464907_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.bias key (0.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.weight lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.external_feature_model.vit.conv1.weight key (1.0, 0.00717897987691853, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.weight key (1.0, 0.03874204890000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.weight key (1.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.bias lr_decay_rate 0.5904900000000001 name module.module.external_feature_model.vit.decoder.layers.18.ls2 lr_decay_rate 0.531441_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.weight key (1.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.weight key (0.0, 0.04782969000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.weight lr_decay_rate 0.9 name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.bias lr_decay_rate 0.531441name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.bias lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.weight key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.weight key (0.0, 0.04304672100000001, False, False)name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.weight lr_decay_rate 0.07976644307687256_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.bias key (0.0, 0.05904900000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.bias key (0.0, 0.05904900000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.bias lr_decay_rate 0.3874204890000001 name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.bias lr_decay_rate 0.5904900000000001 name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.weight lr_decay_rate 0.531441_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.ls2 key (0.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.conv1.bias lr_decay_rate 0.0717897987691853_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.weight key (1.0, 0.09000000000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.bias lr_decay_rate 0.4782969000000001 name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.bias lr_decay_rate 0.18530201888518416_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.bias key (0.0, 0.05314410000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.bias key (0.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.bias key (0.0, 0.03874204890000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.bias key (0.0, 0.05904900000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.bias lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.weight key (1.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.bias lr_decay_rate 0.4304672100000001 name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.weight lr_decay_rate 0.5904900000000001 name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.weight lr_decay_rate 0.5904900000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.weight key (0.0, 0.05314410000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.bias key (0.0, 0.04782969000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.bias lr_decay_rate 0.9 name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.weight lr_decay_rate 0.531441 _get_param_groups name module.module.external_feature_model.vit.conv1.bias key (0.0, 0.00717897987691853, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.bias key (0.0, 0.018530201888518418, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.bias key (0.0, 0.02058911320946491, False, False)name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.weight lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.weight key (1.0, 0.05904900000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.weight lr_decay_rate 0.531441name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.weight lr_decay_rate 0.3874204890000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.weight key (1.0, 0.05904900000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.weight lr_decay_rate 0.5904900000000001name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.bias lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.bias key (0.0, 0.04304672100000001, False, False) name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.weight lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.bias key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.weight key (0.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.bias lr_decay_rate 0.531441 name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.weight lr_decay_rate 0.18530201888518416_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.bias key (0.0, 0.007976644307687256, False, False)name module.module.external_feature_model.vit.position_embeddings.weight lr_decay_rate 0.0717897987691853 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.weight key (0.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.weight key (1.0, 0.03874204890000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.weight key (1.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.bias lr_decay_rate 0.5904900000000001name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.weight lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.bias lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.weight key (1.0, 0.05904900000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.bias lr_decay_rate 0.531441 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.weight key (1.0, 0.04782969000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.weight lr_decay_rate 0.4304672100000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.bias key (0.0, 0.05314410000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.weight key (1.0, 0.018530201888518418, False, False)name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.weight lr_decay_rate 0.9name module.module.external_feature_model.vit.decoder.layers.1.ls1 lr_decay_rate 0.08862938119652507name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.bias lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.position_embeddings.weight key (1.0, 0.00717897987691853, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.bias key (0.0, 0.05904900000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.bias lr_decay_rate 0.531441_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.bias key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.bias key (0.0, 0.05314410000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.bias lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.weight key (1.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.weight key (1.0, 0.04304672100000001, False, False) name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.bias lr_decay_rate 0.5904900000000001name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.bias lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.bias key (0.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.weight lr_decay_rate 0.531441 name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.bias lr_decay_rate 0.4782969000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.ls1 key (0.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.weight key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.bias key (0.0, 0.05314410000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.bias key (0.0, 0.03874204890000001, False, False) name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.weight lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.bias key (0.0, 0.05904900000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.bias key (0.0, 0.018530201888518418, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.bias key (0.0, 0.04782969000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.weight lr_decay_rate 0.531441name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.weight lr_decay_rate 0.5904900000000001name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.bias lr_decay_rate 0.20589113209464907name module.module.external_feature_model.vit.decoder.layers.0.ls1 lr_decay_rate 0.07976644307687256name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.bias lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.weight key (1.0, 0.05314410000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.weight key (0.0, 0.05904900000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.bias lr_decay_rate 0.9 name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.weight lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.decoder.layers.1.ls2 lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.weight lr_decay_rate 0.531441 name module.module.external_feature_model.vit.decoder.layers.16.ls1 lr_decay_rate 0.4304672100000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.bias key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.weight key (0.0, 0.05904900000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.weight lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.bias key (0.0, 0.02058911320946491, False, False) name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.weight lr_decay_rate 0.4782969000000001name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.bias lr_decay_rate 0.5904900000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.weight key (1.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.9.ls1 lr_decay_rate 0.20589113209464907name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.bias lr_decay_rate 0.531441_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.bias key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.ls1 key (0.0, 0.007976644307687256, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.weight key (0.0, 0.05314410000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.weight key (1.0, 0.012157665459056936, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.weight key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.ls2 key (0.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.ls1 key (0.0, 0.04304672100000001, False, False)name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.bias lr_decay_rate 0.5904900000000001name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.weight lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.weight key (1.0, 0.04782969000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.weight lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.weight lr_decay_rate 0.9 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.bias key (0.0, 0.05904900000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.bias lr_decay_rate 0.5904900000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.bias key (0.0, 0.05314410000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.bias lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.weight lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.ls1 key (0.0, 0.02058911320946491, False, False) name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.bias lr_decay_rate 0.531441_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.bias key (0.0, 0.05904900000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.16.ls2 lr_decay_rate 0.4304672100000001name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.bias lr_decay_rate 0.531441 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.weight key (1.0, 0.04304672100000001, False, False)name module.module.external_feature_model.vit.decoder.layers.0.ls2 lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.bias key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.weight key (1.0, 0.02058911320946491, False, False)name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.weight lr_decay_rate 0.531441name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.bias lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.weight key (1.0, 0.09000000000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.weight lr_decay_rate 0.5904900000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.bias key (0.0, 0.05314410000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.weight lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.ls2 key (0.0, 0.04304672100000001, False, False)name module.module.external_feature_model.vit.decoder.layers.9.ls2 lr_decay_rate 0.20589113209464907_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.bias key (0.0, 0.012157665459056936, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.weight key (0.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.ls2 key (0.0, 0.007976644307687256, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.bias key (0.0, 0.05314410000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.bias lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.weight key (1.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.bias lr_decay_rate 0.20589113209464907_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.bias key (0.0, 0.04782969000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.weight lr_decay_rate 0.5904900000000001 name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.bias lr_decay_rate 0.9_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.ls2 key (0.0, 0.02058911320946491, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.weight key (1.0, 0.05904900000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.weight key (1.0, 0.05904900000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.weight lr_decay_rate 0.531441 name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.weight lr_decay_rate 0.4304672100000001 name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.bias lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.weight lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.weight lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.bias key (0.0, 0.04304672100000001, False, False)name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.weight lr_decay_rate 0.531441_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.weight key (1.0, 0.05904900000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.weight lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.bias key (0.0, 0.02058911320946491, False, False)name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.bias lr_decay_rate 0.531441_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.bias key (0.0, 0.09000000000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.18.ls1 lr_decay_rate 0.531441name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.bias lr_decay_rate 0.5904900000000001name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.bias lr_decay_rate 0.5904900000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.weight key (1.0, 0.05314410000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.weight key (0.0, 0.04304672100000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.bias key (0.0, 0.008862938119652507, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.weight key (1.0, 0.05314410000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.weight key (1.0, 0.012157665459056936, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.weight key (0.0, 0.007976644307687256, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.bias key (0.0, 0.05314410000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.bias lr_decay_rate 0.5904900000000001 name module.module.external_feature_model.vit.decoder.layers.17.ls1 lr_decay_rate 0.4782969000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.bias key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.weight key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.bias key (0.0, 0.05904900000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.bias lr_decay_rate 0.531441 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.ls1 key (0.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.bias lr_decay_rate 0.4304672100000001name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.weight lr_decay_rate 0.9name module.module.external_feature_model.vit.decoder.layers.10.ls1 lr_decay_rate 0.2287679245496101 name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.bias lr_decay_rate 0.531441 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.bias key (0.0, 0.05904900000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.bias lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.19.ls1 lr_decay_rate 0.5904900000000001 name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.weight lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.bias key (0.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.bias lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.ls1 key (0.0, 0.04782969000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.bias key (0.0, 0.05314410000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.weight lr_decay_rate 0.5904900000000001 name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.bias lr_decay_rate 0.20589113209464907_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.weight key (1.0, 0.09000000000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.bias key (0.0, 0.04304672100000001, False, False) name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.weight lr_decay_rate 0.5904900000000001name module.module.external_feature_model.vit.decoder.layers.18.ls2 lr_decay_rate 0.531441 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.bias key (0.0, 0.012157665459056936, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.ls1 key (0.0, 0.02287679245496101, False, False)name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.weight lr_decay_rate 0.5904900000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.weight key (1.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.ls1 key (0.0, 0.05904900000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.bias key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.17.ls2 lr_decay_rate 0.4782969000000001 name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.weight lr_decay_rate 0.531441_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.bias key (0.0, 0.02058911320946491, False, False)name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.bias lr_decay_rate 0.9 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.weight key (1.0, 0.05904900000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.weight key (1.0, 0.05904900000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.ls2 key (0.0, 0.05314410000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.weight lr_decay_rate 0.531441 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.weight key (1.0, 0.05904900000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.10.ls2 lr_decay_rate 0.2287679245496101name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.bias lr_decay_rate 0.08862938119652507name module.module.external_feature_model.vit.decoder.layers.19.ls2 lr_decay_rate 0.5904900000000001name module.module.external_feature_model.vit.decoder.layers.5.ls1 lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.weight lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.weight key (1.0, 0.05314410000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.ls2 key (0.0, 0.04782969000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.weight key (0.0, 0.05314410000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.bias lr_decay_rate 0.5904900000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.bias key (0.0, 0.09000000000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.bias lr_decay_rate 0.5904900000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.ls2 key (0.0, 0.05904900000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.weight lr_decay_rate 0.531441 name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.weight lr_decay_rate 0.20589113209464907name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.weight lr_decay_rate 0.07976644307687256_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.ls2 key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.bias key (0.0, 0.008862938119652507, False, False)name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.bias lr_decay_rate 0.5904900000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.ls1 key (0.0, 0.013508517176729929, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.bias key (0.0, 0.05904900000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.weight key (1.0, 0.04304672100000001, False, False)name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.bias lr_decay_rate 0.531441name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.weight lr_decay_rate 0.5904900000000001 name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.bias lr_decay_rate 0.531441 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.bias key (0.0, 0.05904900000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.weight lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.weight key (1.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.weight key (1.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.bias key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.weight key (0.0, 0.05314410000000001, False, False) _get_param_groups name module.module.external_feature_model.vision_projection.encoder.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.weight lr_decay_rate 0.2287679245496101name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.weight lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.5.ls2 lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.bias key (0.0, 0.05314410000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.weight key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.bias key (0.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.20.ls1 lr_decay_rate 0.6561 name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.bias lr_decay_rate 0.4304672100000001 name module.module.external_feature_model.vit.decoder.layers.20.ls1 lr_decay_rate 0.6561 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.weight key (0.0, 0.04782969000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.bias lr_decay_rate 0.531441name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.bias lr_decay_rate 0.20589113209464907name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.bias lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.ls2 key (0.0, 0.013508517176729929, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.weight key (0.0, 0.02287679245496101, False, False) name module.module.external_feature_model.vit.decoder.layers.20.ls1 lr_decay_rate 0.6561 _get_param_groups name module.module.external_feature_model.vision_projection.encoder.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.bias lr_decay_rate 0.5904900000000001name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.weight lr_decay_rate 0.531441_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.ls1 key (0.0, 0.06561, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.weight key (1.0, 0.008862938119652507, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.ls1 key (0.0, 0.06561, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.bias key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.bias key (0.0, 0.02058911320946491, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.bias key (0.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.19.ls1 lr_decay_rate 0.5904900000000001name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.bias lr_decay_rate 0.4782969000000001 name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.weight lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.ls1 key (0.0, 0.06561, False, False) name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.bias lr_decay_rate 0.08862938119652507_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.bias key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.bias lr_decay_rate 0.2287679245496101name module.module.external_feature_model.vit.decoder.layers.20.ls2 lr_decay_rate 0.6561_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.weight key (1.0, 0.05314410000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.bias key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.external_feature_model.pre_proj_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.weight lr_decay_rate 0.4304672100000001 name module.module.external_feature_model.vit.decoder.layers.20.ls2 lr_decay_rate 0.6561name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.weight lr_decay_rate 0.531441_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.ls1 key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.bias key (0.0, 0.04782969000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.weight lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.weight key (0.0, 0.013508517176729929, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.bias key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.bias key (0.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.ls2 key (0.0, 0.06561, False, False) name module.module.external_feature_model.vit.decoder.layers.20.ls2 lr_decay_rate 0.6561_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.ls2 key (0.0, 0.06561, False, False) name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.weight lr_decay_rate 0.07976644307687256name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.bias lr_decay_rate 0.531441 _get_param_groups name module.module.external_feature_model.pre_proj_layernorm.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.weight key (1.0, 0.04304672100000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.weight key (1.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.19.ls2 lr_decay_rate 0.5904900000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.weight key (1.0, 0.02058911320946491, False, False) name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.weight lr_decay_rate 0.6561_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.bias key (0.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.bias lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.weight key (1.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.weight lr_decay_rate 0.5904900000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.ls2 key (0.0, 0.06561, False, False) name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.weight lr_decay_rate 0.2287679245496101name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.weight lr_decay_rate 0.4782969000000001 name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.bias lr_decay_rate 0.4304672100000001_get_param_groups name module.module.embedding.word_embeddings.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.weight lr_decay_rate 0.6561 name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.weight lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.bias lr_decay_rate 0.531441 name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.weight lr_decay_rate 0.531441 name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.bias lr_decay_rate 0.20589113209464907_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.bias key (0.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.bias lr_decay_rate 0.07976644307687256_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.ls2 key (0.0, 0.05904900000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.weight key (0.0, 0.06561, False, False) name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.weight lr_decay_rate 0.6561 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.weight key (1.0, 0.05904900000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.weight key (1.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.weight key (0.0, 0.06561, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.weight key (1.0, 0.04782969000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.bias key (0.0, 0.04304672100000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.bias key (0.0, 0.05314410000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.weight key (0.0, 0.008862938119652507, False, False)_get_param_groups name module.module.decoder.layers.0.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.bias key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.weight key (1.0, 0.05314410000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.weight key (0.0, 0.06561, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.bias key (0.0, 0.007976644307687256, False, False)name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.weight lr_decay_rate 0.5904900000000001name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.bias lr_decay_rate 0.6561 name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.bias lr_decay_rate 0.2287679245496101 name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.weight lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.bias lr_decay_rate 0.5904900000000001 name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.bias lr_decay_rate 0.4782969000000001name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.bias lr_decay_rate 0.531441name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.bias lr_decay_rate 0.08862938119652507name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.weight lr_decay_rate 0.531441 name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.weight lr_decay_rate 0.4304672100000001 name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.bias lr_decay_rate 0.6561 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.bias key (0.0, 0.06561, False, False)name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.weight lr_decay_rate 0.20589113209464907name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.bias lr_decay_rate 0.6561_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.weight key (1.0, 0.013508517176729929, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.weight key (1.0, 0.05314410000000001, False, False)_get_param_groups name module.module.decoder.layers.0.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.weight key (0.0, 0.05904900000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.bias key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.bias key (0.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.weight lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.bias key (0.0, 0.05904900000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.weight key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.bias key (0.0, 0.06561, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.bias key (0.0, 0.04782969000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.bias key (0.0, 0.05314410000000001, False, False) _get_param_groups name module.module.decoder.layers.0.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.bias lr_decay_rate 0.5904900000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.weight key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.bias key (0.0, 0.06561, False, False)name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.weight lr_decay_rate 0.2287679245496101 name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.bias lr_decay_rate 0.531441name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.bias lr_decay_rate 0.13508517176729928name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.weight lr_decay_rate 0.6561 name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.bias lr_decay_rate 0.4304672100000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.weight key (0.0, 0.007976644307687256, False, False)name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.weight lr_decay_rate 0.08862938119652507_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.bias key (0.0, 0.05904900000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.weight lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.decoder.layers.0.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.bias lr_decay_rate 0.20589113209464907name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.weight lr_decay_rate 0.4782969000000001 name module.module.external_feature_model.vit.decoder.layers.19.ls1 lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.bias key (0.0, 0.05314410000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.weight key (1.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.bias key (0.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.weight lr_decay_rate 0.6561 name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.weight lr_decay_rate 0.6561_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.weight key (1.0, 0.06561, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.bias key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.weight key (1.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.bias key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.weight key (1.0, 0.05904900000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.weight key (1.0, 0.04782969000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.bias lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.ls1 key (0.0, 0.05904900000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.weight key (1.0, 0.06561, False, False) name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.weight lr_decay_rate 0.5904900000000001_get_param_groups name module.module.decoder.layers.0.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.bias lr_decay_rate 0.2287679245496101_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.weight key (1.0, 0.06561, False, False) name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.weight lr_decay_rate 0.13508517176729928name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.weight lr_decay_rate 0.531441 name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.bias lr_decay_rate 0.6561 name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.weight lr_decay_rate 0.4304672100000001name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.weight lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.bias lr_decay_rate 0.4782969000000001 name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.bias lr_decay_rate 0.5904900000000001 name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.bias lr_decay_rate 0.08862938119652507_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.bias key (0.0, 0.007976644307687256, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.weight key (0.0, 0.05314410000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.bias lr_decay_rate 0.6561 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.weight key (1.0, 0.02058911320946491, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.weight key (1.0, 0.013508517176729929, False, False)name module.module.external_feature_model.vit.decoder.layers.19.ls2 lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.bias key (0.0, 0.06561, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.bias key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.weight key (1.0, 0.05904900000000001, False, False)_get_param_groups name module.module.decoder.layers.0.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.bias key (0.0, 0.04782969000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.bias lr_decay_rate 0.6561_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.weight key (1.0, 0.04304672100000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.bias key (0.0, 0.05904900000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.bias key (0.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.bias lr_decay_rate 0.531441 name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.weight lr_decay_rate 0.07976644307687256name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.weight lr_decay_rate 0.6561name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.bias lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.bias lr_decay_rate 0.20589113209464907name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.weight lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.bias key (0.0, 0.06561, False, False) name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.bias lr_decay_rate 0.5904900000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.ls2 key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.decoder.layers.0.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.bias key (0.0, 0.06561, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.bias key (0.0, 0.05314410000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.weight key (1.0, 0.06561, False, False) name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.weight lr_decay_rate 0.08862938119652507name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.bias lr_decay_rate 0.4304672100000001 name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.weight lr_decay_rate 0.4782969000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.weight key (0.0, 0.02287679245496101, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.weight key (1.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.bias key (0.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.weight lr_decay_rate 0.6561 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.bias key (0.0, 0.02058911320946491, False, False)name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.weight lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.bias key (0.0, 0.05904900000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.weight lr_decay_rate 0.6561_get_param_groups name module.module.decoder.layers.1.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.weight lr_decay_rate 0.5904900000000001 name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.bias lr_decay_rate 0.6561 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.weight key (1.0, 0.06561, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.weight key (1.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.weight lr_decay_rate 0.531441_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.weight key (0.0, 0.04782969000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.bias lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.bias key (0.0, 0.04304672100000001, False, False)name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.weight lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.bias lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.decoder.layers.1.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.weight lr_decay_rate 0.5904900000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.weight key (0.0, 0.05904900000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.weight key (0.0, 0.05904900000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.bias lr_decay_rate 0.4782969000000001name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.weight lr_decay_rate 0.20589113209464907_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.weight key (1.0, 0.06561, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.weight key (1.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.bias lr_decay_rate 0.6561 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.bias key (0.0, 0.06561, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.weight key (0.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.weight lr_decay_rate 0.4304672100000001 name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.bias lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.bias key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.bias key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.bias lr_decay_rate 0.5904900000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.bias key (0.0, 0.04782969000000001, False, False)_get_param_groups name module.module.decoder.layers.1.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.weight key (1.0, 0.05904900000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.bias lr_decay_rate 0.531441_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.bias key (0.0, 0.008862938119652507, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.weight key (1.0, 0.02058911320946491, False, False)name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.bias lr_decay_rate 0.5904900000000001 name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.bias lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.bias key (0.0, 0.06561, False, False)name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.bias lr_decay_rate 0.6561 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.weight key (1.0, 0.04304672100000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.bias key (0.0, 0.05904900000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.weight lr_decay_rate 0.6561name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.weight lr_decay_rate 0.2287679245496101 name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.weight lr_decay_rate 0.4782969000000001name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.weight lr_decay_rate 0.07976644307687256_get_param_groups name module.module.decoder.layers.1.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.bias lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.bias key (0.0, 0.05314410000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.bias key (0.0, 0.05904900000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.bias lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.bias key (0.0, 0.06561, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.bias key (0.0, 0.013508517176729929, False, False)name module.module.external_feature_model.vit.decoder.layers.2.ls1 lr_decay_rate 0.09847709021836118name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.bias lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.weight key (0.0, 0.06561, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.weight key (1.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.weight key (1.0, 0.04782969000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.weight key (1.0, 0.007976644307687256, False, False)name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.weight lr_decay_rate 0.6561 name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.weight lr_decay_rate 0.5904900000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.bias key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.decoder.layers.1.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.bias lr_decay_rate 0.6561 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.bias key (0.0, 0.02058911320946491, False, False)name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.weight lr_decay_rate 0.531441name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.weight lr_decay_rate 0.5904900000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.weight key (0.0, 0.06561, False, False) name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.weight lr_decay_rate 0.6561 name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.bias lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.decoder.layers.1.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.bias lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.bias key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.ls1 key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.weight lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.bias lr_decay_rate 0.2287679245496101_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.weight key (1.0, 0.05904900000000001, False, False) _get_param_groups name module.module.decoder.layers.1.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.bias key (0.0, 0.06561, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.weight key (0.0, 0.06561, False, False)name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.weight lr_decay_rate 0.5904900000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.bias key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.bias key (0.0, 0.007976644307687256, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.weight key (1.0, 0.05314410000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.weight key (1.0, 0.05904900000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.bias lr_decay_rate 0.6561 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.weight key (1.0, 0.013508517176729929, False, False)name module.module.external_feature_model.vit.decoder.layers.2.ls2 lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.10.ls1 lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.decoder.layers.2.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.bias key (0.0, 0.02287679245496101, False, False)name module.module.external_feature_model.vit.decoder.layers.17.ls1 lr_decay_rate 0.4782969000000001name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.weight lr_decay_rate 0.6561name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.bias lr_decay_rate 0.5904900000000001 name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.bias lr_decay_rate 0.531441name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.weight lr_decay_rate 0.4782969000000001name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.bias lr_decay_rate 0.6561 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.ls2 key (0.0, 0.00984770902183612, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.weight key (0.0, 0.05904900000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.bias key (0.0, 0.06561, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.ls1 key (0.0, 0.02287679245496101, False, False) name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.bias lr_decay_rate 0.5904900000000001 name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.bias lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.weight lr_decay_rate 0.2287679245496101 name module.module.external_feature_model.vit.decoder.layers.1.ls1 lr_decay_rate 0.08862938119652507_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.weight key (1.0, 0.06561, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.bias key (0.0, 0.05904900000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.ls1 key (0.0, 0.04782969000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.bias key (0.0, 0.06561, False, False)_get_param_groups name module.module.decoder.layers.2.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.bias key (0.0, 0.05314410000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.weight key (1.0, 0.04782969000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.10.ls2 lr_decay_rate 0.2287679245496101name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.weight lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.weight key (1.0, 0.02287679245496101, False, False) name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.bias lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.bias key (0.0, 0.05904900000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.bias key (0.0, 0.013508517176729929, False, False)name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.weight lr_decay_rate 0.6561 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.ls1 key (0.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.bias lr_decay_rate 0.6561 name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.weight lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.bias key (0.0, 0.05904900000000001, False, False)_get_param_groups name module.module.decoder.layers.2.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.17.ls2 lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.ls2 key (0.0, 0.02287679245496101, False, False)name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.weight lr_decay_rate 0.6561_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.weight key (0.0, 0.00984770902183612, False, False)name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.bias lr_decay_rate 0.4782969000000001name module.module.external_feature_model.vit.decoder.layers.19.ls1 lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.weight key (1.0, 0.06561, False, False) name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.bias lr_decay_rate 0.2287679245496101_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.bias key (0.0, 0.06561, False, False) name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.weight lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.weight lr_decay_rate 0.5904900000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.weight key (1.0, 0.05904900000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.1.ls2 lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.ls2 key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.bias key (0.0, 0.04782969000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.weight key (1.0, 0.06561, False, False) _get_param_groups name module.module.decoder.layers.2.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.ls1 key (0.0, 0.05904900000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.weight lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.bias key (0.0, 0.02287679245496101, False, False) name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.bias lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.weight lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.weight key (1.0, 0.05904900000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.bias lr_decay_rate 0.6561 name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.weight lr_decay_rate 0.6561_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.weight key (1.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.bias lr_decay_rate 0.5904900000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.ls2 key (0.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.weight lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.bias key (0.0, 0.06561, False, False)name module.module.external_feature_model.vit.decoder.layers.18.ls1 lr_decay_rate 0.531441name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.bias lr_decay_rate 0.6561name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.bias lr_decay_rate 0.5904900000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.bias key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.19.ls2 lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.weight key (1.0, 0.05904900000000001, False, False) _get_param_groups name module.module.decoder.layers.2.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.weight key (1.0, 0.06561, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.weight key (0.0, 0.02287679245496101, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.bias key (0.0, 0.05904900000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.weight lr_decay_rate 0.08862938119652507name module.module.external_feature_model.vit.decoder.layers.11.ls1 lr_decay_rate 0.2541865828329001name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.bias lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.weight key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.bias key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.ls2 key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.bias key (0.0, 0.06561, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.ls1 key (0.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.weight lr_decay_rate 0.6561 _get_param_groups name module.module.decoder.layers.2.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.bias lr_decay_rate 0.6561name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.bias lr_decay_rate 0.5904900000000001name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.weight lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.bias lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.bias key (0.0, 0.013508517176729929, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.weight key (0.0, 0.008862938119652507, False, False)name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.weight lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.ls1 key (0.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.20.ls1 lr_decay_rate 0.6561 name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.bias lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.bias key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.weight key (1.0, 0.06561, False, False)name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.weight lr_decay_rate 0.6561name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.weight lr_decay_rate 0.5904900000000001 name module.module.external_feature_model.vit.decoder.layers.18.ls2 lr_decay_rate 0.531441 _get_param_groups name module.module.decoder.layers.2.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.bias key (0.0, 0.06561, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.weight key (1.0, 0.00984770902183612, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.bias key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.weight key (0.0, 0.05904900000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.bias key (0.0, 0.04782969000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.6.ls1 lr_decay_rate 0.15009463529699918_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.weight key (1.0, 0.06561, False, False)name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.bias lr_decay_rate 0.08862938119652507name module.module.external_feature_model.vit.decoder.layers.11.ls2 lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.ls2 key (0.0, 0.05314410000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.ls1 key (0.0, 0.06561, False, False) name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.bias lr_decay_rate 0.09847709021836118name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.bias lr_decay_rate 0.6561 name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.bias lr_decay_rate 0.5904900000000001name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.weight lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.weight key (0.0, 0.05904900000000001, False, False)_get_param_groups name module.module.decoder.layers.3.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.weight lr_decay_rate 0.2287679245496101 name module.module.external_feature_model.vit.decoder.layers.21.ls1 lr_decay_rate 0.7290000000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.ls1 key (0.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.bias key (0.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.ls2 key (0.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.bias key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.bias lr_decay_rate 0.6561name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.weight lr_decay_rate 0.531441 name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.weight lr_decay_rate 0.4782969000000001 name module.module.external_feature_model.vit.decoder.layers.20.ls2 lr_decay_rate 0.6561_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.weight key (1.0, 0.05904900000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.bias key (0.0, 0.06561, False, False) name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.bias lr_decay_rate 0.5904900000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.bias key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.decoder.layers.3.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.weight key (1.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.ls1 key (0.0, 0.0729, False, False)name module.module.external_feature_model.vit.decoder.layers.6.ls2 lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.weight lr_decay_rate 0.2541865828329001name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.weight lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.bias key (0.0, 0.06561, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.weight key (0.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.weight lr_decay_rate 0.09847709021836118_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.ls2 key (0.0, 0.06561, False, False) name module.module.external_feature_model.vit.decoder.layers.21.ls1 lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.weight key (1.0, 0.04782969000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.bias key (0.0, 0.05904900000000001, False, False)_get_param_groups name module.module.decoder.layers.3.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.bias lr_decay_rate 0.5904900000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.ls2 key (0.0, 0.015009463529699918, False, False)name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.bias lr_decay_rate 0.2287679245496101name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.weight lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.weight key (1.0, 0.00984770902183612, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.weight key (0.0, 0.02541865828329001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.ls1 key (0.0, 0.0729, False, False) name module.module.external_feature_model.vit.decoder.layers.21.ls2 lr_decay_rate 0.7290000000000001name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.bias lr_decay_rate 0.531441 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.weight key (1.0, 0.008862938119652507, False, False)name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.weight lr_decay_rate 0.6561 _get_param_groups name module.module.decoder.layers.3.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.weight key (1.0, 0.05904900000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.bias key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.bias key (0.0, 0.05904900000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.21.ls1 lr_decay_rate 0.7290000000000001 name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.bias lr_decay_rate 0.4782969000000001 name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.weight lr_decay_rate 0.5904900000000001 name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.weight lr_decay_rate 0.15009463529699918name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.bias lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.bias key (0.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.bias lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.ls2 key (0.0, 0.0729, False, False) name module.module.external_feature_model.vit.decoder.layers.21.ls2 lr_decay_rate 0.7290000000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.weight key (0.0, 0.06561, False, False) name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.bias lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.bias lr_decay_rate 0.5904900000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.bias key (0.0, 0.04782969000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.weight lr_decay_rate 0.2287679245496101_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.ls1 key (0.0, 0.0729, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.weight key (0.0, 0.015009463529699918, False, False)_get_param_groups name module.module.decoder.layers.3.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.20.ls1 lr_decay_rate 0.6561 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.weight key (1.0, 0.05904900000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.bias key (0.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.bias key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.weight lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.bias key (0.0, 0.05904900000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.bias key (0.0, 0.008862938119652507, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.ls2 key (0.0, 0.0729, False, False) name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.bias lr_decay_rate 0.6561name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.weight lr_decay_rate 0.531441 name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.weight lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.weight key (0.0, 0.0729, False, False)name module.module.external_feature_model.vit.decoder.layers.21.ls2 lr_decay_rate 0.7290000000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.weight key (1.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.ls1 key (0.0, 0.06561, False, False)_get_param_groups name module.module.decoder.layers.3.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.bias lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.weight key (1.0, 0.05314410000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.bias lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.weight lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.weight lr_decay_rate 0.5904900000000001name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.weight lr_decay_rate 0.2541865828329001 name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.weight lr_decay_rate 0.09847709021836118_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.bias key (0.0, 0.06561, False, False) name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.weight lr_decay_rate 0.7290000000000001 name module.module.external_feature_model.vit.decoder.layers.20.ls2 lr_decay_rate 0.6561_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.weight key (1.0, 0.04782969000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.weight key (1.0, 0.05904900000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.ls2 key (0.0, 0.0729, False, False)_get_param_groups name module.module.decoder.layers.3.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.bias lr_decay_rate 0.7290000000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.bias key (0.0, 0.015009463529699918, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.weight key (1.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.bias key (0.0, 0.05904900000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.bias lr_decay_rate 0.2287679245496101 name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.weight lr_decay_rate 0.6561_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.ls2 key (0.0, 0.06561, False, False)name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.bias lr_decay_rate 0.531441 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.weight key (0.0, 0.0729, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.weight key (1.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.weight key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.bias lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.bias key (0.0, 0.0729, False, False) _get_param_groups name module.module.decoder.layers.4.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.weight lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.bias lr_decay_rate 0.5904900000000001name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.weight lr_decay_rate 0.7290000000000001name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.bias lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.weight lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.bias key (0.0, 0.02287679245496101, False, False) name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.weight lr_decay_rate 0.6561_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.bias key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.weight key (1.0, 0.06561, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.bias key (0.0, 0.05314410000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.bias lr_decay_rate 0.7290000000000001name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.bias lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.bias key (0.0, 0.05904900000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.bias lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.decoder.layers.4.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.weight key (1.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.weight lr_decay_rate 0.7290000000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.weight key (0.0, 0.06561, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.bias key (0.0, 0.02541865828329001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.weight key (0.0, 0.0729, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.bias key (0.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.weight key (1.0, 0.05904900000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.bias key (0.0, 0.0729, False, False)name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.bias lr_decay_rate 0.6561 name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.weight lr_decay_rate 0.2287679245496101_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.bias key (0.0, 0.00984770902183612, False, False)name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.weight lr_decay_rate 0.4782969000000001 name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.weight lr_decay_rate 0.531441name module.module.external_feature_model.vit.decoder.layers.20.ls1 lr_decay_rate 0.6561 name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.bias lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.decoder.layers.4.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.weight lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.weight key (1.0, 0.0729, False, False) name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.bias lr_decay_rate 0.6561name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.bias lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.bias key (0.0, 0.06561, False, False)name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.bias lr_decay_rate 0.5904900000000001 name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.weight lr_decay_rate 0.7290000000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.ls1 key (0.0, 0.06561, False, False) name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.weight lr_decay_rate 0.08862938119652507_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.weight key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.weight key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.weight key (1.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.weight lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.bias lr_decay_rate 0.7290000000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.bias key (0.0, 0.015009463529699918, False, False) _get_param_groups name module.module.decoder.layers.4.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.weight key (1.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.bias key (0.0, 0.06561, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.bias key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.bias key (0.0, 0.0729, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.weight key (1.0, 0.0729, False, False) name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.weight lr_decay_rate 0.6561 name module.module.external_feature_model.vit.decoder.layers.20.ls2 lr_decay_rate 0.6561 name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.bias lr_decay_rate 0.2287679245496101_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.weight key (0.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.bias lr_decay_rate 0.531441_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.weight key (1.0, 0.00984770902183612, False, False)name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.bias lr_decay_rate 0.4782969000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.bias key (0.0, 0.0729, False, False) name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.weight lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.bias lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.ls2 key (0.0, 0.06561, False, False)name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.weight lr_decay_rate 0.6561 name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.weight lr_decay_rate 0.7290000000000001 name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.bias lr_decay_rate 0.7290000000000001_get_param_groups name module.module.decoder.layers.4.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.weight key (1.0, 0.06561, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.bias key (0.0, 0.02287679245496101, False, False) name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.bias lr_decay_rate 0.09847709021836118name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.weight lr_decay_rate 0.5904900000000001name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.bias lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.bias key (0.0, 0.05314410000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.bias key (0.0, 0.04782969000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.weight lr_decay_rate 0.7290000000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.weight key (1.0, 0.015009463529699918, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.weight key (1.0, 0.06561, False, False)name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.weight lr_decay_rate 0.6561_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.bias key (0.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.weight lr_decay_rate 0.2287679245496101_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.bias key (0.0, 0.0729, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.bias key (0.0, 0.00984770902183612, False, False) _get_param_groups name module.module.decoder.layers.4.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.weight key (1.0, 0.0729, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.bias key (0.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.weight lr_decay_rate 0.531441 name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.bias lr_decay_rate 0.6561_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.weight key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.weight key (1.0, 0.0729, False, False) name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.bias lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.weight key (0.0, 0.06561, False, False)name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.weight lr_decay_rate 0.4782969000000001 name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.bias lr_decay_rate 0.6561name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.weight lr_decay_rate 0.09847709021836118_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.weight key (1.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.bias key (0.0, 0.06561, False, False) name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.weight lr_decay_rate 0.2541865828329001_get_param_groups name module.module.decoder.layers.4.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.weight lr_decay_rate 0.7290000000000001 name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.bias lr_decay_rate 0.7290000000000001 name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.bias lr_decay_rate 0.7290000000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.weight key (0.0, 0.05314410000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.bias lr_decay_rate 0.6561name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.weight lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.bias key (0.0, 0.015009463529699918, False, False)name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.bias lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.weight key (1.0, 0.04782969000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.bias lr_decay_rate 0.2287679245496101_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.weight key (1.0, 0.0729, False, False)_get_param_groups name module.module.decoder.layers.5.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.bias key (0.0, 0.06561, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.weight key (1.0, 0.00984770902183612, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.bias key (0.0, 0.0729, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.bias key (0.0, 0.0729, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.weight key (0.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.weight lr_decay_rate 0.6561_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.bias key (0.0, 0.05904900000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.bias key (0.0, 0.06561, False, False) name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.bias lr_decay_rate 0.531441 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.weight key (1.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.bias lr_decay_rate 0.09847709021836118name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.weight lr_decay_rate 0.15009463529699918_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.bias key (0.0, 0.02287679245496101, False, False) name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.bias lr_decay_rate 0.4782969000000001name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.bias lr_decay_rate 0.7290000000000001 name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.weight lr_decay_rate 0.6561 _get_param_groups name module.module.decoder.layers.5.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.weight lr_decay_rate 0.7290000000000001name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.bias lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.weight key (0.0, 0.06561, False, False) name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.bias lr_decay_rate 0.08862938119652507_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.bias key (0.0, 0.05314410000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.weight lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.weight key (1.0, 0.06561, False, False)name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.weight lr_decay_rate 0.2287679245496101name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.weight lr_decay_rate 0.5904900000000001name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.weight lr_decay_rate 0.6561 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.bias key (0.0, 0.00984770902183612, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.bias key (0.0, 0.0729, False, False)_get_param_groups name module.module.decoder.layers.5.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.weight key (0.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.bias key (0.0, 0.04782969000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.weight lr_decay_rate 0.531441 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.weight key (1.0, 0.0729, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.bias key (0.0, 0.02541865828329001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.bias key (0.0, 0.008862938119652507, False, False) name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.bias lr_decay_rate 0.6561 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.weight key (1.0, 0.05904900000000001, False, False) _get_param_groups name module.module.decoder.layers.5.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.weight key (1.0, 0.06561, False, False) name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.bias lr_decay_rate 0.6561_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.weight key (0.0, 0.0729, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.weight key (1.0, 0.02287679245496101, False, False) name module.module.external_feature_model.vit.decoder.layers.3.ls1 lr_decay_rate 0.10941898913151242 name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.bias lr_decay_rate 0.7290000000000001name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.weight lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.weight key (1.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.weight lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.bias key (0.0, 0.06561, False, False)name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.weight lr_decay_rate 0.2541865828329001 name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.weight lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.bias lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.bias key (0.0, 0.06561, False, False)_get_param_groups name module.module.decoder.layers.5.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.bias lr_decay_rate 0.7290000000000001name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.bias lr_decay_rate 0.6561name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.bias lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.bias key (0.0, 0.0729, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.ls1 key (0.0, 0.010941898913151242, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.weight key (1.0, 0.04782969000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.weight key (0.0, 0.0729, False, False)name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.bias lr_decay_rate 0.531441 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.weight key (1.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.weight lr_decay_rate 0.6561_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.bias key (0.0, 0.02287679245496101, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.bias key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.bias key (0.0, 0.0729, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.weight key (1.0, 0.008862938119652507, False, False)_get_param_groups name module.module.decoder.layers.5.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.bias key (0.0, 0.06561, False, False) name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.weight lr_decay_rate 0.6561name module.module.external_feature_model.vit.decoder.layers.3.ls2 lr_decay_rate 0.10941898913151242 name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.bias lr_decay_rate 0.4782969000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.bias key (0.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.bias lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.decoder.layers.5.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.11.ls1 lr_decay_rate 0.2541865828329001name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.bias lr_decay_rate 0.2541865828329001 name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.weight lr_decay_rate 0.7290000000000001 name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.weight lr_decay_rate 0.6561 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.weight key (1.0, 0.06561, False, False) name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.weight lr_decay_rate 0.7290000000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.ls2 key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.weight lr_decay_rate 0.5904900000000001name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.bias lr_decay_rate 0.08862938119652507name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.bias lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.weight key (1.0, 0.06561, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.weight key (0.0, 0.06561, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.bias key (0.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.bias key (0.0, 0.04782969000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.weight key (1.0, 0.0729, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.ls1 key (0.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.bias key (0.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.bias key (0.0, 0.0729, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.weight key (0.0, 0.0729, False, False) name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.weight lr_decay_rate 0.531441_get_param_groups name module.module.decoder.layers.6.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.bias key (0.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.bias lr_decay_rate 0.6561 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.weight key (1.0, 0.05904900000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.weight lr_decay_rate 0.10941898913151242 name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.bias lr_decay_rate 0.6561 name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.bias lr_decay_rate 0.6561 name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.bias lr_decay_rate 0.7290000000000001name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.weight lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.weight key (1.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.weight lr_decay_rate 0.7290000000000001 name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.bias lr_decay_rate 0.7290000000000001 name module.module.external_feature_model.vit.decoder.layers.11.ls2 lr_decay_rate 0.2541865828329001 name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.bias lr_decay_rate 0.5904900000000001name module.module.external_feature_model.vit.decoder.layers.18.ls1 lr_decay_rate 0.531441 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.bias key (0.0, 0.06561, False, False)name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.weight lr_decay_rate 0.15009463529699918_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.bias key (0.0, 0.06561, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.bias key (0.0, 0.06561, False, False)name module.module.external_feature_model.vit.decoder.layers.2.ls1 lr_decay_rate 0.09847709021836118_get_param_groups name module.module.decoder.layers.6.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.weight key (1.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.weight key (0.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.bias key (0.0, 0.0729, False, False) name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.bias lr_decay_rate 0.531441_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.weight key (1.0, 0.0729, False, False)name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.weight lr_decay_rate 0.6561 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.bias key (0.0, 0.0729, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.ls2 key (0.0, 0.02541865828329001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.bias key (0.0, 0.05904900000000001, False, False)_get_param_groups name module.module.decoder.layers.6.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.ls1 key (0.0, 0.05314410000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.weight key (1.0, 0.015009463529699918, False, False)name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.bias lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.ls1 key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.bias lr_decay_rate 0.10941898913151242name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.weight lr_decay_rate 0.6561_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.bias key (0.0, 0.05314410000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.weight lr_decay_rate 0.6561_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.weight key (1.0, 0.06561, False, False)name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.bias lr_decay_rate 0.7290000000000001 name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.weight lr_decay_rate 0.7290000000000001 name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.weight lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.bias key (0.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.20.ls1 lr_decay_rate 0.6561_get_param_groups name module.module.decoder.layers.6.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.18.ls2 lr_decay_rate 0.531441 name module.module.external_feature_model.vit.decoder.layers.2.ls2 lr_decay_rate 0.09847709021836118name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.weight lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.bias key (0.0, 0.010941898913151242, False, False)name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.bias lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.bias key (0.0, 0.0729, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.weight key (1.0, 0.06561, False, False) name module.module.external_feature_model.vit.decoder.layers.19.ls1 lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.weight key (0.0, 0.06561, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.weight key (1.0, 0.0729, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.weight key (0.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.bias lr_decay_rate 0.6561 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.weight key (1.0, 0.0729, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.ls1 key (0.0, 0.06561, False, False) name module.module.external_feature_model.vit.decoder.layers.12.ls1 lr_decay_rate 0.2824295364810001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.ls2 key (0.0, 0.05314410000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.ls2 key (0.0, 0.00984770902183612, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.bias key (0.0, 0.015009463529699918, False, False)_get_param_groups name module.module.decoder.layers.6.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.bias lr_decay_rate 0.2541865828329001 name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.weight lr_decay_rate 0.7290000000000001name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.weight lr_decay_rate 0.10941898913151242 name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.bias lr_decay_rate 0.6561 name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.bias lr_decay_rate 0.7290000000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.bias key (0.0, 0.06561, False, False)name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.bias lr_decay_rate 0.6561_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.ls1 key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.ls1 key (0.0, 0.028242953648100012, False, False) name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.bias lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.decoder.layers.6.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.20.ls2 lr_decay_rate 0.6561name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.weight lr_decay_rate 0.531441_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.bias key (0.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.weight key (1.0, 0.0729, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.bias key (0.0, 0.06561, False, False)name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.weight lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.weight lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.weight key (1.0, 0.010941898913151242, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.bias key (0.0, 0.0729, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.bias key (0.0, 0.06561, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.bias key (0.0, 0.0729, False, False)name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.bias lr_decay_rate 0.7290000000000001name module.module.external_feature_model.vit.decoder.layers.19.ls2 lr_decay_rate 0.5904900000000001name module.module.external_feature_model.vit.decoder.layers.21.ls1 lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.weight key (0.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.12.ls2 lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.ls2 key (0.0, 0.06561, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.weight key (1.0, 0.015009463529699918, False, False) _get_param_groups name module.module.decoder.layers.6.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.weight key (0.0, 0.00984770902183612, False, False)name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.weight lr_decay_rate 0.6561name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.bias lr_decay_rate 0.10941898913151242 name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.weight lr_decay_rate 0.2541865828329001 name module.module.external_feature_model.vit.decoder.layers.22.ls1 lr_decay_rate 0.81 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.ls1 key (0.0, 0.0729, False, False)name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.weight lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.ls2 key (0.0, 0.028242953648100012, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.bias key (0.0, 0.0729, False, False) name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.weight lr_decay_rate 0.6561 name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.weight lr_decay_rate 0.6561_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.ls2 key (0.0, 0.05904900000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.bias lr_decay_rate 0.531441_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.weight key (1.0, 0.06561, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.ls1 key (0.0, 0.08100000000000002, False, False) name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.bias lr_decay_rate 0.15009463529699918_get_param_groups name module.module.decoder.layers.7.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.bias lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.bias key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.21.ls2 lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.weight key (1.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.weight lr_decay_rate 0.2824295364810001name module.module.external_feature_model.vit.decoder.layers.22.ls1 lr_decay_rate 0.81 name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.bias lr_decay_rate 0.6561_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.weight key (1.0, 0.0729, False, False) name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.weight lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.weight key (0.0, 0.06561, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.weight key (1.0, 0.06561, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.bias key (0.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.bias key (0.0, 0.05314410000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.bias key (0.0, 0.00984770902183612, False, False) _get_param_groups name module.module.decoder.layers.7.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.ls2 lr_decay_rate 0.81 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.ls2 key (0.0, 0.0729, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.ls1 key (0.0, 0.08100000000000002, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.weight key (0.0, 0.028242953648100012, False, False) name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.weight lr_decay_rate 0.10941898913151242name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.bias lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.bias key (0.0, 0.06561, False, False) name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.bias lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.weight key (0.0, 0.05904900000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.ls2 key (0.0, 0.08100000000000002, False, False) name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.bias lr_decay_rate 0.6561name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.bias lr_decay_rate 0.6561 _get_param_groups name module.module.decoder.layers.7.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.22.ls2 lr_decay_rate 0.81 name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.weight lr_decay_rate 0.09847709021836118name module.module.external_feature_model.vit.decoder.layers.7.ls1 lr_decay_rate 0.16677181699666577_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.weight key (1.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.weight lr_decay_rate 0.7290000000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.bias key (0.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.weight lr_decay_rate 0.531441 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.bias key (0.0, 0.06561, False, False) name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.bias lr_decay_rate 0.5904900000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.bias key (0.0, 0.0729, False, False)name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.bias lr_decay_rate 0.2824295364810001 name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.weight lr_decay_rate 0.6561 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.bias key (0.0, 0.06561, False, False)name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.weight lr_decay_rate 0.81 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.weight key (1.0, 0.00984770902183612, False, False)_get_param_groups name module.module.decoder.layers.7.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.ls2 key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.weight key (0.0, 0.0729, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.ls1 key (0.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.weight lr_decay_rate 0.2541865828329001name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.bias lr_decay_rate 0.10941898913151242name module.module.external_feature_model.vit.decoder.layers.21.ls1 lr_decay_rate 0.7290000000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.weight key (1.0, 0.06561, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.bias key (0.0, 0.05904900000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.weight key (1.0, 0.05314410000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.bias key (0.0, 0.028242953648100012, False, False) name module.module.external_feature_model.vit.decoder.layers.22.ls1 lr_decay_rate 0.81 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.weight key (0.0, 0.08100000000000002, False, False) name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.bias lr_decay_rate 0.09847709021836118name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.weight lr_decay_rate 0.6561_get_param_groups name module.module.decoder.layers.7.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.weight lr_decay_rate 0.81 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.weight key (1.0, 0.02541865828329001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.bias key (0.0, 0.010941898913151242, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.ls1 key (0.0, 0.0729, False, False)name module.module.external_feature_model.vit.decoder.layers.7.ls2 lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.bias lr_decay_rate 0.7290000000000001 name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.bias lr_decay_rate 0.81 name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.bias lr_decay_rate 0.6561 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.ls1 key (0.0, 0.08100000000000002, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.weight key (1.0, 0.06561, False, False) name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.weight lr_decay_rate 0.2824295364810001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.bias key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.weight lr_decay_rate 0.5904900000000001name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.bias lr_decay_rate 0.531441_get_param_groups name module.module.decoder.layers.7.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.weight key (0.0, 0.08100000000000002, False, False)name module.module.external_feature_model.vit.decoder.layers.21.ls2 lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.bias key (0.0, 0.0729, False, False) name module.module.external_feature_model.vit.decoder.layers.22.ls2 lr_decay_rate 0.81 name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.bias lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.ls2 key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.bias key (0.0, 0.08100000000000002, False, False) name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.bias lr_decay_rate 0.6561name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.weight lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.bias key (0.0, 0.06561, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.weight key (1.0, 0.028242953648100012, False, False) _get_param_groups name module.module.decoder.layers.7.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.weight key (1.0, 0.05904900000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.ls2 key (0.0, 0.0729, False, False)name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.weight lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.bias lr_decay_rate 0.81 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.bias key (0.0, 0.05314410000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.ls2 key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.bias key (0.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.bias key (0.0, 0.06561, False, False) name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.weight lr_decay_rate 0.7290000000000001 name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.weight lr_decay_rate 0.16677181699666577_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.weight key (0.0, 0.010941898913151242, False, False)name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.bias lr_decay_rate 0.2824295364810001name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.weight lr_decay_rate 0.81 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.weight key (1.0, 0.00984770902183612, False, False)name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.bias lr_decay_rate 0.5904900000000001name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.weight lr_decay_rate 0.7290000000000001 name module.module.external_feature_model.vit.decoder.layers.21.ls1 lr_decay_rate 0.7290000000000001_get_param_groups name module.module.decoder.layers.8.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.bias key (0.0, 0.08100000000000002, False, False) name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.weight lr_decay_rate 0.6561 name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.weight lr_decay_rate 0.531441_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.bias key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.weight key (0.0, 0.016677181699666577, False, False)name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.weight lr_decay_rate 0.81 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.bias key (0.0, 0.028242953648100012, False, False) name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.weight lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.weight key (1.0, 0.0729, False, False) name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.bias lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.weight key (1.0, 0.08100000000000002, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.weight key (0.0, 0.0729, False, False) _get_param_groups name module.module.decoder.layers.8.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.bias lr_decay_rate 0.09847709021836118_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.ls1 key (0.0, 0.0729, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.weight key (1.0, 0.05314410000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.weight key (1.0, 0.06561, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.weight key (0.0, 0.08100000000000002, False, False)name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.bias lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.weight lr_decay_rate 0.5904900000000001 name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.weight lr_decay_rate 0.81 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.weight key (0.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.bias lr_decay_rate 0.7290000000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.bias key (0.0, 0.010941898913151242, False, False)name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.weight lr_decay_rate 0.2824295364810001 name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.bias lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.bias key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.bias lr_decay_rate 0.81_get_param_groups name module.module.decoder.layers.8.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.21.ls2 lr_decay_rate 0.7290000000000001 name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.bias lr_decay_rate 0.6561name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.bias lr_decay_rate 0.531441_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.bias key (0.0, 0.016677181699666577, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.weight key (1.0, 0.08100000000000002, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.weight key (1.0, 0.05904900000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.weight lr_decay_rate 0.10941898913151242 name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.bias lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.bias key (0.0, 0.0729, False, False)name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.bias lr_decay_rate 0.81_get_param_groups name module.module.decoder.layers.8.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.bias key (0.0, 0.0729, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.weight key (1.0, 0.028242953648100012, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.ls2 key (0.0, 0.0729, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.weight key (1.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.bias key (0.0, 0.08100000000000002, False, False)name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.weight lr_decay_rate 0.09847709021836118_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.bias key (0.0, 0.06561, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.bias key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.bias key (0.0, 0.05314410000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.bias key (0.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.bias lr_decay_rate 0.81 _get_param_groups name module.module.decoder.layers.8.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.bias lr_decay_rate 0.5904900000000001 name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.weight lr_decay_rate 0.7290000000000001name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.bias lr_decay_rate 0.2824295364810001name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.weight lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.weight lr_decay_rate 0.7290000000000001name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.bias lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.weight key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.weight lr_decay_rate 0.7290000000000001name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.weight lr_decay_rate 0.81 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.bias key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.bias key (0.0, 0.05904900000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.weight lr_decay_rate 0.81 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.bias key (0.0, 0.010941898913151242, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.bias key (0.0, 0.028242953648100012, False, False) name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.weight lr_decay_rate 0.6561name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.weight lr_decay_rate 0.2541865828329001_get_param_groups name module.module.decoder.layers.8.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.weight lr_decay_rate 0.531441_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.weight key (1.0, 0.0729, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.weight key (1.0, 0.016677181699666577, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.weight key (0.0, 0.0729, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.weight key (1.0, 0.0729, False, False)name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.bias lr_decay_rate 0.09847709021836118_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.weight key (1.0, 0.08100000000000002, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.weight key (1.0, 0.02541865828329001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.weight key (1.0, 0.08100000000000002, False, False) name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.weight lr_decay_rate 0.81_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.weight key (0.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.bias lr_decay_rate 0.7290000000000001name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.bias lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.weight key (0.0, 0.06561, False, False) name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.weight lr_decay_rate 0.5904900000000001name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.weight lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.bias key (0.0, 0.00984770902183612, False, False)_get_param_groups name module.module.decoder.layers.8.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.bias lr_decay_rate 0.81name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.bias lr_decay_rate 0.81name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.bias lr_decay_rate 0.7290000000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.bias key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.weight key (1.0, 0.08100000000000002, False, False) name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.weight lr_decay_rate 0.2824295364810001 name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.bias lr_decay_rate 0.7290000000000001 name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.bias lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.bias key (0.0, 0.0729, False, False) name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.bias lr_decay_rate 0.6561name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.bias lr_decay_rate 0.531441 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.weight key (1.0, 0.010941898913151242, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.weight key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.bias key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.bias key (0.0, 0.08100000000000002, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.bias key (0.0, 0.0729, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.weight key (0.0, 0.028242953648100012, False, False) name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.weight lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.decoder.layers.9.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.weight lr_decay_rate 0.09847709021836118name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.bias lr_decay_rate 0.81_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.bias key (0.0, 0.0729, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.bias key (0.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.bias lr_decay_rate 0.10941898913151242name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.bias lr_decay_rate 0.5904900000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.bias key (0.0, 0.06561, False, False) name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.bias lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.bias key (0.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.weight lr_decay_rate 0.7290000000000001name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.weight lr_decay_rate 0.81_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.bias key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.weight key (1.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.bias key (0.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.bias key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.weight key (1.0, 0.00984770902183612, False, False) _get_param_groups name module.module.decoder.layers.9.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.weight lr_decay_rate 0.7290000000000001name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.weight lr_decay_rate 0.81 name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.weight lr_decay_rate 0.6561name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.weight lr_decay_rate 0.7290000000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.bias key (0.0, 0.028242953648100012, False, False) name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.weight lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.weight key (1.0, 0.08100000000000002, False, False)name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.weight lr_decay_rate 0.531441name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.bias lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.weight key (0.0, 0.0729, False, False) name module.module.external_feature_model.vit.decoder.layers.4.ls1 lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.weight lr_decay_rate 0.81name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.weight lr_decay_rate 0.5904900000000001 name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.bias lr_decay_rate 0.09847709021836118_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.weight key (1.0, 0.0729, False, False) _get_param_groups name module.module.decoder.layers.9.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.weight key (1.0, 0.06561, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.weight key (1.0, 0.0729, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.weight key (1.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.bias lr_decay_rate 0.81_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.weight key (0.0, 0.08100000000000002, False, False) name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.bias lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.bias key (0.0, 0.016677181699666577, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.ls1 key (0.0, 0.012157665459056936, False, False) _get_param_groups name module.module.decoder.layers.9.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.weight key (1.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.weight lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.weight key (0.0, 0.08100000000000002, False, False) name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.bias lr_decay_rate 0.6561 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.weight key (1.0, 0.05904900000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.bias lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.bias key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.bias lr_decay_rate 0.81 name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.bias lr_decay_rate 0.2541865828329001name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.bias lr_decay_rate 0.7290000000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.bias key (0.0, 0.08100000000000002, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.bias key (0.0, 0.0729, False, False) name module.module.external_feature_model.vit.decoder.layers.4.ls2 lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.weight lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.bias lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.decoder.layers.9.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.bias lr_decay_rate 0.531441name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.bias lr_decay_rate 0.81 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.bias key (0.0, 0.06561, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.weight key (1.0, 0.028242953648100012, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.bias key (0.0, 0.0729, False, False) name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.weight lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.bias key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.bias key (0.0, 0.02541865828329001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.bias key (0.0, 0.0729, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.ls2 key (0.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.weight lr_decay_rate 0.7290000000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.weight key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.bias key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.bias key (0.0, 0.05314410000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.bias key (0.0, 0.08100000000000002, False, False) name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.weight lr_decay_rate 0.81 name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.weight lr_decay_rate 0.6561 _get_param_groups name module.module.decoder.layers.9.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.weight key (1.0, 0.00984770902183612, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.weight key (1.0, 0.0729, False, False)name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.weight lr_decay_rate 0.81 name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.bias lr_decay_rate 0.2824295364810001 name module.module.external_feature_model.vit.decoder.layers.12.ls1 lr_decay_rate 0.2824295364810001name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.weight lr_decay_rate 0.7290000000000001name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.weight lr_decay_rate 0.7290000000000001 name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.bias lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.weight lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.weight key (1.0, 0.06561, False, False) name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.weight lr_decay_rate 0.5904900000000001 name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.weight lr_decay_rate 0.81name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.bias lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.weight lr_decay_rate 0.531441_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.weight key (0.0, 0.08100000000000002, False, False)_get_param_groups name module.module.decoder.layers.9.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.ls1 key (0.0, 0.028242953648100012, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.weight key (1.0, 0.08100000000000002, False, False) name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.bias lr_decay_rate 0.7290000000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.bias key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.weight key (0.0, 0.0729, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.weight key (1.0, 0.0729, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.bias key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.weight key (1.0, 0.05904900000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.weight key (0.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.bias lr_decay_rate 0.6561_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.weight key (1.0, 0.08100000000000002, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.bias key (0.0, 0.00984770902183612, False, False)name module.module.external_feature_model.vit.decoder.layers.12.ls2 lr_decay_rate 0.2824295364810001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.weight key (1.0, 0.05314410000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.bias lr_decay_rate 0.81 name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.bias lr_decay_rate 0.81_get_param_groups name module.module.decoder.layers.10.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.bias key (0.0, 0.0729, False, False) name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.bias lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.bias lr_decay_rate 0.81name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.bias lr_decay_rate 0.5904900000000001name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.weight lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.weight lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.ls2 key (0.0, 0.028242953648100012, False, False)name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.bias lr_decay_rate 0.7290000000000001 name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.bias lr_decay_rate 0.7290000000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.bias key (0.0, 0.06561, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.bias key (0.0, 0.08100000000000002, False, False) name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.bias lr_decay_rate 0.531441name module.module.external_feature_model.vit.decoder.layers.3.ls1 lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.weight key (1.0, 0.016677181699666577, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.bias key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.weight key (1.0, 0.028242953648100012, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.bias key (0.0, 0.08100000000000002, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.bias key (0.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.bias key (0.0, 0.05904900000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.bias key (0.0, 0.0729, False, False) name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.weight lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.bias key (0.0, 0.0729, False, False)_get_param_groups name module.module.decoder.layers.10.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.weight lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.bias key (0.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.weight lr_decay_rate 0.81name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.bias lr_decay_rate 0.2824295364810001name module.module.external_feature_model.vit.decoder.layers.21.ls1 lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.ls1 key (0.0, 0.010941898913151242, False, False)name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.bias lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.weight lr_decay_rate 0.81name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.weight lr_decay_rate 0.81name module.module.external_feature_model.vit.decoder.layers.20.ls1 lr_decay_rate 0.6561_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.weight key (1.0, 0.0729, False, False)name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.weight lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.weight lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.decoder.layers.10.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.bias key (0.0, 0.016677181699666577, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.weight key (0.0, 0.028242953648100012, False, False) name module.module.external_feature_model.vit.decoder.layers.3.ls2 lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.bias key (0.0, 0.028242953648100012, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.weight key (1.0, 0.08100000000000002, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.ls1 key (0.0, 0.0729, False, False) name module.module.external_feature_model.vit.decoder.layers.19.ls1 lr_decay_rate 0.5904900000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.weight key (1.0, 0.08100000000000002, False, False)name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.weight lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.weight key (1.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.weight key (1.0, 0.08100000000000002, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.weight key (1.0, 0.0729, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.ls1 key (0.0, 0.06561, False, False)name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.bias lr_decay_rate 0.7290000000000001_get_param_groups name module.module.decoder.layers.10.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.weight lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.bias lr_decay_rate 0.81_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.weight key (0.0, 0.0729, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.ls2 key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.bias lr_decay_rate 0.81 name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.bias lr_decay_rate 0.2824295364810001name module.module.external_feature_model.vit.decoder.layers.13.ls1 lr_decay_rate 0.31381059609000006 name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.bias lr_decay_rate 0.81 name module.module.external_feature_model.vit.decoder.layers.21.ls2 lr_decay_rate 0.7290000000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.ls1 key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.bias key (0.0, 0.0729, False, False) name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.bias lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.bias lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.bias key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.10.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.20.ls2 lr_decay_rate 0.6561name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.bias lr_decay_rate 0.7290000000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.bias key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.weight key (1.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.ls2 key (0.0, 0.0729, False, False) name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.weight lr_decay_rate 0.10941898913151242 name module.module.external_feature_model.vit.decoder.layers.22.ls1 lr_decay_rate 0.81_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.bias key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.bias key (0.0, 0.08100000000000002, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.ls1 key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.bias key (0.0, 0.0729, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.bias key (0.0, 0.0729, False, False)name module.module.external_feature_model.vit.decoder.layers.19.ls2 lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.bias key (0.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.23.ls1 lr_decay_rate 0.9_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.ls1 key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.ls2 key (0.0, 0.06561, False, False)_get_param_groups name module.module.decoder.layers.10.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.weight lr_decay_rate 0.7290000000000001 name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.bias lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.weight key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.23.ls1 lr_decay_rate 0.9 name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.weight lr_decay_rate 0.2824295364810001name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.weight lr_decay_rate 0.81name module.module.external_feature_model.vit.decoder.layers.13.ls2 lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.ls2 key (0.0, 0.05904900000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.weight lr_decay_rate 0.7290000000000001name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.weight lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.ls1 key (0.0, 0.09000000000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.weight lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.weight lr_decay_rate 0.6561 name module.module.external_feature_model.vit.decoder.layers.22.ls2 lr_decay_rate 0.81_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.weight key (0.0, 0.0729, False, False)name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.bias lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.bias key (0.0, 0.016677181699666577, False, False)_get_param_groups name module.module.decoder.layers.10.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.ls2 key (0.0, 0.031381059609000006, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.ls1 key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.weight key (1.0, 0.08100000000000002, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.weight key (1.0, 0.0729, False, False)name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.weight lr_decay_rate 0.5904900000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.weight key (1.0, 0.028242953648100012, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.weight key (1.0, 0.0729, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.weight key (1.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.weight key (0.0, 0.06561, False, False) name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.bias lr_decay_rate 0.7290000000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.ls2 key (0.0, 0.08100000000000002, False, False)name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.weight lr_decay_rate 0.31381059609000006 name module.module.external_feature_model.vit.decoder.layers.23.ls2 lr_decay_rate 0.9_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.bias key (0.0, 0.010941898913151242, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.weight key (0.0, 0.05904900000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.8.ls1 lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.bias lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.decoder.layers.11.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.bias lr_decay_rate 0.7290000000000001name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.bias lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.23.ls2 lr_decay_rate 0.9name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.bias lr_decay_rate 0.81 name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.bias lr_decay_rate 0.7290000000000001 name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.bias lr_decay_rate 0.6561_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.weight key (0.0, 0.031381059609000006, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.bias key (0.0, 0.0729, False, False) name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.weight lr_decay_rate 0.81_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.ls2 key (0.0, 0.09000000000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.ls1 key (0.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.bias lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.bias key (0.0, 0.028242953648100012, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.bias key (0.0, 0.0729, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.bias key (0.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.8.ls2 lr_decay_rate 0.18530201888518416name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.weight lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.ls2 key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.bias key (0.0, 0.08100000000000002, False, False)_get_param_groups name module.module.decoder.layers.11.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.bias key (0.0, 0.0729, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.bias key (0.0, 0.06561, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.weight key (0.0, 0.08100000000000002, False, False)name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.weight lr_decay_rate 0.9name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.bias lr_decay_rate 0.31381059609000006name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.weight lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.bias key (0.0, 0.05904900000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.22.ls1 lr_decay_rate 0.81_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.weight key (1.0, 0.010941898913151242, False, False) _get_param_groups name module.module.decoder.layers.11.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.weight lr_decay_rate 0.2824295364810001name module.module.external_feature_model.vit.decoder.layers.23.ls1 lr_decay_rate 0.9 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.ls2 key (0.0, 0.018530201888518418, False, False)name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.weight lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.bias key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.weight key (0.0, 0.09000000000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.weight lr_decay_rate 0.7290000000000001name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.weight lr_decay_rate 0.6561name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.bias lr_decay_rate 0.81 name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.weight lr_decay_rate 0.9_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.weight key (1.0, 0.0729, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.ls1 key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.11.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.weight lr_decay_rate 0.5904900000000001name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.bias lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.weight key (1.0, 0.028242953648100012, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.weight key (1.0, 0.06561, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.bias key (0.0, 0.08100000000000002, False, False) name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.weight lr_decay_rate 0.18530201888518416_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.ls1 key (0.0, 0.09000000000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.weight lr_decay_rate 0.31381059609000006_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.weight key (0.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.weight key (1.0, 0.0729, False, False)name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.bias lr_decay_rate 0.9name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.bias lr_decay_rate 0.7290000000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.weight key (0.0, 0.09000000000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.22.ls2 lr_decay_rate 0.81name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.bias lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.bias key (0.0, 0.010941898913151242, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.weight key (1.0, 0.05904900000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.bias lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.decoder.layers.11.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.bias key (0.0, 0.09000000000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.bias lr_decay_rate 0.6561_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.weight key (1.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.weight lr_decay_rate 0.81 name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.bias lr_decay_rate 0.9 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.weight key (0.0, 0.018530201888518418, False, False)name module.module.external_feature_model.vit.decoder.layers.23.ls2 lr_decay_rate 0.9_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.bias key (0.0, 0.0729, False, False)name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.bias lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.ls2 key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.bias key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.decoder.layers.11.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.bias key (0.0, 0.06561, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.bias key (0.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.weight lr_decay_rate 0.10941898913151242name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.bias lr_decay_rate 0.5904900000000001name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.weight lr_decay_rate 0.7290000000000001name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.bias lr_decay_rate 0.31381059609000006 name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.bias lr_decay_rate 0.18530201888518416_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.weight key (1.0, 0.08100000000000002, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.bias key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.ls2 key (0.0, 0.09000000000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.bias key (0.0, 0.0729, False, False) name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.weight lr_decay_rate 0.9 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.bias key (0.0, 0.05904900000000001, False, False)_get_param_groups name module.module.decoder.layers.11.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.weight lr_decay_rate 0.81name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.weight lr_decay_rate 0.6561 name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.weight lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.weight lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.bias key (0.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.weight key (1.0, 0.010941898913151242, False, False)name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.bias lr_decay_rate 0.81_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.weight key (1.0, 0.0729, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.bias key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.weight key (1.0, 0.09000000000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.weight lr_decay_rate 0.9name module.module.external_feature_model.vit.decoder.layers.22.ls1 lr_decay_rate 0.81 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.weight key (0.0, 0.08100000000000002, False, False)name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.weight lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.weight key (1.0, 0.012157665459056936, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.weight key (1.0, 0.06561, False, False) _get_param_groups name module.module.decoder.layers.12.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.weight lr_decay_rate 0.9 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.weight key (0.0, 0.028242953648100012, False, False)name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.bias lr_decay_rate 0.7290000000000001 name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.weight lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.bias key (0.0, 0.08100000000000002, False, False) name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.bias lr_decay_rate 0.9name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.bias lr_decay_rate 0.10941898913151242name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.bias lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.weight lr_decay_rate 0.31381059609000006_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.weight key (1.0, 0.09000000000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.ls1 key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.weight key (0.0, 0.09000000000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.weight key (1.0, 0.05904900000000001, False, False)_get_param_groups name module.module.decoder.layers.12.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.bias lr_decay_rate 0.81 name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.bias lr_decay_rate 0.6561 name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.bias lr_decay_rate 0.2824295364810001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.weight key (1.0, 0.018530201888518418, False, False)name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.weight lr_decay_rate 0.81 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.bias key (0.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.bias key (0.0, 0.0729, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.bias key (0.0, 0.010941898913151242, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.bias key (0.0, 0.09000000000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.22.ls2 lr_decay_rate 0.81name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.bias lr_decay_rate 0.9 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.weight key (1.0, 0.031381059609000006, False, False)name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.bias lr_decay_rate 0.9 name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.bias lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.bias key (0.0, 0.028242953648100012, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.weight key (1.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.12.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.bias key (0.0, 0.06561, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.bias key (0.0, 0.08100000000000002, False, False) name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.bias lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.weight lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.ls2 key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.bias key (0.0, 0.05904900000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.weight lr_decay_rate 0.10941898913151242 name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.weight lr_decay_rate 0.9name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.weight lr_decay_rate 0.7290000000000001_get_param_groups name module.module.decoder.layers.12.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.bias key (0.0, 0.09000000000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.bias lr_decay_rate 0.31381059609000006name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.weight lr_decay_rate 0.2824295364810001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.bias key (0.0, 0.09000000000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.bias lr_decay_rate 0.81 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.bias key (0.0, 0.018530201888518418, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.weight key (1.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.weight lr_decay_rate 0.6561_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.weight key (1.0, 0.09000000000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.weight lr_decay_rate 0.81name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.weight lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.weight key (0.0, 0.0729, False, False) name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.weight lr_decay_rate 0.81 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.weight key (0.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.bias key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.decoder.layers.12.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.weight lr_decay_rate 0.9_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.weight key (1.0, 0.028242953648100012, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.bias key (0.0, 0.08100000000000002, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.weight key (0.0, 0.06561, False, False)name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.bias lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.bias lr_decay_rate 0.9 name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.weight lr_decay_rate 0.9 name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.weight lr_decay_rate 0.18530201888518416_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.weight key (1.0, 0.08100000000000002, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.weight key (0.0, 0.05904900000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.bias lr_decay_rate 0.7290000000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.weight key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.12.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.weight key (1.0, 0.09000000000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.weight lr_decay_rate 0.31381059609000006 name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.bias lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.bias key (0.0, 0.09000000000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.bias lr_decay_rate 0.6561 name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.bias lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.bias key (0.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.weight key (1.0, 0.018530201888518418, False, False)name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.weight lr_decay_rate 0.81 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.weight key (1.0, 0.09000000000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.bias key (0.0, 0.0729, False, False)name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.bias lr_decay_rate 0.5904900000000001name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.bias lr_decay_rate 0.81name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.bias lr_decay_rate 0.81 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.bias key (0.0, 0.06561, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.bias key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.decoder.layers.12.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.weight key (0.0, 0.031381059609000006, False, False)name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.bias lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.bias key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.bias lr_decay_rate 0.9 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.bias key (0.0, 0.05904900000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.weight key (0.0, 0.08100000000000002, False, False) name module.module.external_feature_model.vit.decoder.layers.5.ls1 lr_decay_rate 0.13508517176729928name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.bias lr_decay_rate 0.9 name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.weight lr_decay_rate 0.9 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.bias key (0.0, 0.08100000000000002, False, False)name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.weight lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.bias key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.13.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.bias key (0.0, 0.018530201888518418, False, False)name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.weight lr_decay_rate 0.6561name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.bias lr_decay_rate 0.31381059609000006 name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.weight lr_decay_rate 0.2824295364810001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.bias key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.ls1 key (0.0, 0.013508517176729929, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.bias key (0.0, 0.09000000000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.weight lr_decay_rate 0.10941898913151242name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.bias lr_decay_rate 0.81_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.weight key (1.0, 0.0729, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.weight key (1.0, 0.06561, False, False)name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.weight lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.weight key (0.0, 0.09000000000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.weight lr_decay_rate 0.81_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.bias key (0.0, 0.031381059609000006, False, False)_get_param_groups name module.module.decoder.layers.13.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.weight lr_decay_rate 0.81_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.weight key (1.0, 0.028242953648100012, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.bias key (0.0, 0.08100000000000002, False, False)name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.weight lr_decay_rate 0.18530201888518416name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.weight lr_decay_rate 0.9 name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.bias lr_decay_rate 0.6561 name module.module.external_feature_model.vit.decoder.layers.5.ls2 lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.weight key (1.0, 0.010941898913151242, False, False)name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.bias lr_decay_rate 0.7290000000000001name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.weight lr_decay_rate 0.9name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.bias lr_decay_rate 0.9_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.weight key (1.0, 0.05904900000000001, False, False) _get_param_groups name module.module.decoder.layers.13.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.weight key (1.0, 0.08100000000000002, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.weight key (1.0, 0.08100000000000002, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.bias key (0.0, 0.06561, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.bias key (0.0, 0.0729, False, False)name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.weight lr_decay_rate 0.31381059609000006_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.weight key (0.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.bias key (0.0, 0.09000000000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.bias lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.weight key (0.0, 0.09000000000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.weight lr_decay_rate 0.81_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.ls2 key (0.0, 0.013508517176729929, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.weight key (1.0, 0.09000000000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.bias lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.decoder.layers.13.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.bias lr_decay_rate 0.81name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.weight lr_decay_rate 0.6561 name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.bias lr_decay_rate 0.5904900000000001 name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.bias lr_decay_rate 0.81 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.bias key (0.0, 0.028242953648100012, False, False) name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.bias lr_decay_rate 0.18530201888518416name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.weight lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.weight key (1.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.weight lr_decay_rate 0.7290000000000001name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.bias lr_decay_rate 0.9 name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.weight lr_decay_rate 0.9_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.weight key (1.0, 0.08100000000000002, False, False)name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.bias lr_decay_rate 0.9_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.bias key (0.0, 0.05904900000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.bias key (0.0, 0.010941898913151242, False, False) _get_param_groups name module.module.decoder.layers.13.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.bias key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.weight key (1.0, 0.06561, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.weight key (0.0, 0.013508517176729929, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.bias key (0.0, 0.08100000000000002, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.bias key (0.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.decoder.layers.13.ls1 lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.weight key (1.0, 0.0729, False, False)name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.bias lr_decay_rate 0.31381059609000006_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.bias key (0.0, 0.09000000000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.bias key (0.0, 0.09000000000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.weight lr_decay_rate 0.81_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.weight key (1.0, 0.09000000000000001, False, False)_get_param_groups name module.module.decoder.layers.13.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.bias lr_decay_rate 0.81name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.weight lr_decay_rate 0.10941898913151242 name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.weight lr_decay_rate 0.5904900000000001name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.bias lr_decay_rate 0.6561_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.ls1 key (0.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.bias lr_decay_rate 0.13508517176729928name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.weight lr_decay_rate 0.18530201888518416name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.weight lr_decay_rate 0.81_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.bias key (0.0, 0.08100000000000002, False, False) name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.bias lr_decay_rate 0.7290000000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.bias key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.decoder.layers.13.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.bias lr_decay_rate 0.9 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.bias key (0.0, 0.06561, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.weight key (1.0, 0.08100000000000002, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.weight key (1.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.weight lr_decay_rate 0.9_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.weight key (1.0, 0.05904900000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.bias key (0.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.weight lr_decay_rate 0.9name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.weight lr_decay_rate 0.81 name module.module.external_feature_model.vit.decoder.layers.13.ls2 lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.weight key (0.0, 0.08100000000000002, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.bias key (0.0, 0.0729, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.weight key (1.0, 0.018530201888518418, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.weight key (1.0, 0.09000000000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.21.ls1 lr_decay_rate 0.7290000000000001 name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.bias lr_decay_rate 0.5904900000000001name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.bias lr_decay_rate 0.81_get_param_groups name module.module.decoder.layers.14.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.bias key (0.0, 0.09000000000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.weight lr_decay_rate 0.31381059609000006 name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.bias lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.weight key (1.0, 0.08100000000000002, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.weight key (0.0, 0.09000000000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.ls2 key (0.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.bias lr_decay_rate 0.81name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.bias lr_decay_rate 0.9 name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.bias lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.weight lr_decay_rate 0.13508517176729928name module.module.external_feature_model.vit.decoder.layers.22.ls1 lr_decay_rate 0.81 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.ls1 key (0.0, 0.0729, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.bias key (0.0, 0.08100000000000002, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.bias key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.bias key (0.0, 0.010941898913151242, False, False)name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.weight lr_decay_rate 0.9_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.bias key (0.0, 0.09000000000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.bias lr_decay_rate 0.81 _get_param_groups name module.module.decoder.layers.14.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.weight key (1.0, 0.031381059609000006, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.bias key (0.0, 0.08100000000000002, False, False)name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.bias lr_decay_rate 0.9 name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.weight lr_decay_rate 0.31381059609000006_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.bias key (0.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.weight key (1.0, 0.013508517176729929, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.ls1 key (0.0, 0.08100000000000002, False, False) name module.module.external_feature_model.vit.decoder.layers.21.ls2 lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.bias key (0.0, 0.08100000000000002, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.weight key (1.0, 0.09000000000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.bias lr_decay_rate 0.31381059609000006name module.module.external_feature_model.vit.decoder.layers.20.ls1 lr_decay_rate 0.6561_get_param_groups name module.module.decoder.layers.14.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.weight lr_decay_rate 0.81name module.module.external_feature_model.vit.decoder.layers.4.ls1 lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.weight lr_decay_rate 0.9_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.bias key (0.0, 0.09000000000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.weight lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.weight key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.ls2 key (0.0, 0.0729, False, False)name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.weight lr_decay_rate 0.81name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.bias lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.22.ls2 lr_decay_rate 0.81 name module.module.external_feature_model.vit.decoder.layers.23.ls1 lr_decay_rate 0.9 name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.bias lr_decay_rate 0.9 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.bias key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.decoder.layers.14.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.weight lr_decay_rate 0.9 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.ls1 key (0.0, 0.06561, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.weight key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.ls1 key (0.0, 0.012157665459056936, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.weight key (1.0, 0.09000000000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.weight key (1.0, 0.08100000000000002, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.bias key (0.0, 0.013508517176729929, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.weight key (1.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.bias lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.ls2 key (0.0, 0.08100000000000002, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.ls1 key (0.0, 0.09000000000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.14.ls1 lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.decoder.layers.14.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.weight lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.bias key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.weight key (1.0, 0.09000000000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.bias lr_decay_rate 0.81 name module.module.external_feature_model.vit.decoder.layers.4.ls2 lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.bias key (0.0, 0.031381059609000006, False, False)name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.bias lr_decay_rate 0.9 name module.module.external_feature_model.vit.decoder.layers.20.ls2 lr_decay_rate 0.6561name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.bias lr_decay_rate 0.81name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.weight lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.ls1 key (0.0, 0.03486784401000001, False, False)name module.module.external_feature_model.vit.decoder.layers.23.ls2 lr_decay_rate 0.9_get_param_groups name module.module.decoder.layers.14.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.bias lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.ls2 key (0.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.weight lr_decay_rate 0.81 name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.bias lr_decay_rate 0.9 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.weight key (0.0, 0.0729, False, False) _get_param_groups name module.module.external_feature_model.vision_projection.encoder.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.bias key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.ls2 key (0.0, 0.06561, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.bias key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.14.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.weight key (1.0, 0.013508517176729929, False, False)name module.module.external_feature_model.vit.decoder.layers.14.ls2 lr_decay_rate 0.3486784401000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.bias key (0.0, 0.08100000000000002, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.ls2 key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.weight key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.bias key (0.0, 0.018530201888518418, False, False)name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.weight lr_decay_rate 0.31381059609000006 name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.bias lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.bias key (0.0, 0.09000000000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.weight lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.weight lr_decay_rate 0.81 _get_param_groups name module.module.external_feature_model.vision_projection.encoder.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.weight lr_decay_rate 0.6561_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.weight key (1.0, 0.031381059609000006, False, False) _get_param_groups name module.module.decoder.layers.15.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.bias lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.ls2 key (0.0, 0.03486784401000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.bias key (0.0, 0.0729, False, False)_get_param_groups name module.module.external_feature_model.vision_projection.encoder.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.weight lr_decay_rate 0.81name module.module.external_feature_model.vit.decoder.layers.9.ls1 lr_decay_rate 0.20589113209464907_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.weight key (1.0, 0.08100000000000002, False, False) name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.bias lr_decay_rate 0.81name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.weight lr_decay_rate 0.9 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.weight key (0.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.bias key (0.0, 0.013508517176729929, False, False)name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.weight lr_decay_rate 0.9 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.weight key (0.0, 0.06561, False, False)_get_param_groups name module.module.external_feature_model.pre_proj_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.bias lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.ls1 key (0.0, 0.02058911320946491, False, False)_get_param_groups name module.module.decoder.layers.15.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.weight key (1.0, 0.08100000000000002, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.bias key (0.0, 0.08100000000000002, False, False)name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.weight lr_decay_rate 0.3486784401000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.weight key (1.0, 0.09000000000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.bias lr_decay_rate 0.81_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.weight key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.bias key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.external_feature_model.vision_projection.encoder.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.weight lr_decay_rate 0.7290000000000001name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.bias lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.weight lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.bias lr_decay_rate 0.81_get_param_groups name module.module.decoder.layers.15.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.bias lr_decay_rate 0.6561 _get_param_groups name module.module.external_feature_model.pre_proj_layernorm.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.9.ls2 lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.bias key (0.0, 0.08100000000000002, False, False) name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.bias lr_decay_rate 0.9 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.weight key (0.0, 0.03486784401000001, False, False) name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.bias lr_decay_rate 0.9_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.bias key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.bias key (0.0, 0.012157665459056936, False, False)_get_param_groups name module.module.decoder.layers.15.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.weight lr_decay_rate 0.81name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.weight lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.weight key (1.0, 0.0729, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.weight key (0.0, 0.013508517176729929, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.bias key (0.0, 0.06561, False, False) _get_param_groups name module.module.external_feature_model.pre_proj_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.ls2 key (0.0, 0.02058911320946491, False, False)_get_param_groups name module.module.embedding.word_embeddings.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.bias key (0.0, 0.09000000000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.bias lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.weight lr_decay_rate 0.81 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.bias key (0.0, 0.09000000000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.weight key (1.0, 0.08100000000000002, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.weight key (1.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.bias lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.23.ls1 lr_decay_rate 0.9 name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.bias lr_decay_rate 0.7290000000000001name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.weight lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.bias key (0.0, 0.03486784401000001, False, False)_get_param_groups name module.module.decoder.layers.15.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.pre_proj_layernorm.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.weight lr_decay_rate 0.6561name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.weight lr_decay_rate 0.20589113209464907name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.weight lr_decay_rate 0.9 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.weight key (1.0, 0.08100000000000002, False, False) name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.bias lr_decay_rate 0.81_get_param_groups name module.module.decoder.layers.0.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vision_projection.encoder.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.bias key (0.0, 0.013508517176729929, False, False)name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.bias lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.ls1 key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.bias key (0.0, 0.0729, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.weight key (1.0, 0.012157665459056936, False, False)_get_param_groups name module.module.decoder.layers.15.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.weight key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.weight key (1.0, 0.09000000000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.weight key (1.0, 0.06561, False, False) _get_param_groups name module.module.embedding.word_embeddings.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.weight lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.bias lr_decay_rate 0.81_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.bias key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.bias key (0.0, 0.031381059609000006, False, False)_get_param_groups name module.module.external_feature_model.vision_projection.encoder.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.weight lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.23.ls2 lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.0.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.bias lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.weight lr_decay_rate 0.7290000000000001_get_param_groups name module.module.decoder.layers.15.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.bias lr_decay_rate 0.6561 name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.bias lr_decay_rate 0.20589113209464907name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.bias lr_decay_rate 0.9 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.bias key (0.0, 0.08100000000000002, False, False)name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.weight lr_decay_rate 0.81_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.weight key (1.0, 0.03486784401000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.weight key (1.0, 0.013508517176729929, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.ls2 key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.0.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.pre_proj_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.weight lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.weight key (1.0, 0.0729, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.bias key (0.0, 0.012157665459056936, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.bias key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.bias key (0.0, 0.06561, False, False)_get_param_groups name module.module.decoder.layers.0.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.16.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.bias key (0.0, 0.02058911320946491, False, False) name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.bias lr_decay_rate 0.3486784401000001_get_param_groups name module.module.external_feature_model.pre_proj_layernorm.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.ls1 lr_decay_rate 0.9name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.bias lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.weight key (1.0, 0.08100000000000002, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.weight key (0.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.weight lr_decay_rate 0.9 name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.weight lr_decay_rate 0.6561_get_param_groups name module.module.decoder.layers.0.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.weight lr_decay_rate 0.9 name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.bias lr_decay_rate 0.7290000000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.bias key (0.0, 0.03486784401000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.bias key (0.0, 0.013508517176729929, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.ls1 key (0.0, 0.09000000000000001, False, False)_get_param_groups name module.module.decoder.layers.16.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.0.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.weight lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.weight lr_decay_rate 0.20589113209464907_get_param_groups name module.module.embedding.word_embeddings.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.bias lr_decay_rate 0.81 name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.bias lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.bias key (0.0, 0.0729, False, False)_get_param_groups name module.module.decoder.layers.0.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.weight key (1.0, 0.09000000000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.weight key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.weight key (1.0, 0.06561, False, False) name module.module.external_feature_model.vit.decoder.layers.23.ls2 lr_decay_rate 0.9 name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.weight lr_decay_rate 0.3486784401000001name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.weight lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.weight key (1.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.bias key (0.0, 0.08100000000000002, False, False)_get_param_groups name module.module.decoder.layers.16.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.weight key (1.0, 0.012157665459056936, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.bias key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.decoder.layers.0.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.bias lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.0.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.bias lr_decay_rate 0.9name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.bias lr_decay_rate 0.6561 _get_param_groups name module.module.decoder.layers.0.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.ls2 key (0.0, 0.09000000000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.bias lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.weight lr_decay_rate 0.81 _get_param_groups name module.module.decoder.layers.0.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.bias key (0.0, 0.06561, False, False)name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.weight lr_decay_rate 0.7290000000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.weight key (1.0, 0.03486784401000001, False, False)_get_param_groups name module.module.decoder.layers.16.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.weight key (1.0, 0.013508517176729929, False, False) _get_param_groups name module.module.decoder.layers.0.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.bias lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.bias key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.weight key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.bias key (0.0, 0.09000000000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.weight lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.decoder.layers.0.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.weight lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.0.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.bias lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.bias key (0.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.bias lr_decay_rate 0.81_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.weight key (0.0, 0.0729, False, False) name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.bias lr_decay_rate 0.3486784401000001_get_param_groups name module.module.decoder.layers.0.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.bias key (0.0, 0.02058911320946491, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.weight key (0.0, 0.09000000000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.weight lr_decay_rate 0.6561_get_param_groups name module.module.decoder.layers.16.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.weight lr_decay_rate 0.9 name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.weight lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.1.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.weight key (1.0, 0.031381059609000006, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.bias key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.bias key (0.0, 0.013508517176729929, False, False)name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.weight lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.decoder.layers.0.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.bias lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.weight key (1.0, 0.09000000000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.bias key (0.0, 0.03486784401000001, False, False) _get_param_groups name module.module.decoder.layers.16.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.0.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.bias lr_decay_rate 0.9_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.weight key (0.0, 0.06561, False, False) name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.weight lr_decay_rate 0.20589113209464907_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.weight key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.1.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.bias lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.weight key (0.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.6.ls1 lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.weight lr_decay_rate 0.81_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.bias key (0.0, 0.0729, False, False) name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.bias lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.0.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.16.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.bias key (0.0, 0.09000000000000001, False, False)_get_param_groups name module.module.decoder.layers.0.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.bias lr_decay_rate 0.9name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.weight lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.bias key (0.0, 0.031381059609000006, False, False)_get_param_groups name module.module.decoder.layers.1.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.bias lr_decay_rate 0.6561_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.weight key (1.0, 0.02058911320946491, False, False)name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.bias lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.weight key (1.0, 0.08100000000000002, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.ls1 key (0.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.bias key (0.0, 0.09000000000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.bias key (0.0, 0.09000000000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.weight lr_decay_rate 0.7290000000000001name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.weight lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.0.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.weight key (0.0, 0.03486784401000001, False, False) _get_param_groups name module.module.decoder.layers.17.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.bias key (0.0, 0.012157665459056936, False, False)_get_param_groups name module.module.decoder.layers.1.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.bias key (0.0, 0.06561, False, False)name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.bias lr_decay_rate 0.20589113209464907_get_param_groups name module.module.decoder.layers.1.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.weight lr_decay_rate 0.31381059609000006 name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.weight lr_decay_rate 0.9 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.weight key (1.0, 0.09000000000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.6.ls2 lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.weight key (1.0, 0.0729, False, False) name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.bias lr_decay_rate 0.81 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.bias key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.decoder.layers.0.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.weight lr_decay_rate 0.9 name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.bias lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.decoder.layers.1.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.ls2 key (0.0, 0.015009463529699918, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.weight key (1.0, 0.031381059609000006, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.weight key (1.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.17.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.1.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.weight lr_decay_rate 0.6561name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.weight lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.bias key (0.0, 0.08100000000000002, False, False) name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.bias lr_decay_rate 0.9name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.bias lr_decay_rate 0.7290000000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.weight key (1.0, 0.09000000000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.bias key (0.0, 0.03486784401000001, False, False)name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.weight lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.weight lr_decay_rate 0.15009463529699918_get_param_groups name module.module.decoder.layers.1.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.1.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.bias lr_decay_rate 0.31381059609000006 name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.bias lr_decay_rate 0.9 name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.bias lr_decay_rate 0.9 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.weight key (1.0, 0.012157665459056936, False, False)_get_param_groups name module.module.decoder.layers.17.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.bias key (0.0, 0.0729, False, False) name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.weight lr_decay_rate 0.81_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.weight key (1.0, 0.06561, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.bias key (0.0, 0.09000000000000001, False, False)_get_param_groups name module.module.decoder.layers.1.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.weight lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.weight key (0.0, 0.02058911320946491, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.weight key (0.0, 0.015009463529699918, False, False)_get_param_groups name module.module.decoder.layers.1.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.bias key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.bias key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.bias key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.17.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.1.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.bias lr_decay_rate 0.12157665459056935_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.weight key (1.0, 0.08100000000000002, False, False) name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.weight lr_decay_rate 0.7290000000000001name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.bias lr_decay_rate 0.6561 name module.module.external_feature_model.vit.decoder.layers.14.ls1 lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.weight lr_decay_rate 0.9_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.weight key (1.0, 0.03486784401000001, False, False)_get_param_groups name module.module.decoder.layers.1.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.bias lr_decay_rate 0.20589113209464907_get_param_groups name module.module.decoder.layers.1.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.bias lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.weight key (1.0, 0.0729, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.bias key (0.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.bias key (0.0, 0.06561, False, False) _get_param_groups name module.module.decoder.layers.17.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.weight lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.1.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.weight lr_decay_rate 0.9name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.bias lr_decay_rate 0.81 _get_param_groups name module.module.decoder.layers.2.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.ls1 key (0.0, 0.03486784401000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.bias key (0.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.weight key (1.0, 0.09000000000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.bias lr_decay_rate 0.7290000000000001 name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.weight lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.weight lr_decay_rate 0.6561_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.bias key (0.0, 0.02058911320946491, False, False) name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.bias lr_decay_rate 0.3486784401000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.weight key (1.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.1.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.17.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.bias key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.1.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.weight key (0.0, 0.09000000000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.weight lr_decay_rate 0.15009463529699918_get_param_groups name module.module.decoder.layers.2.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.14.ls2 lr_decay_rate 0.3486784401000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.bias key (0.0, 0.0729, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.weight key (1.0, 0.06561, False, False) name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.bias lr_decay_rate 0.9name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.weight lr_decay_rate 0.20589113209464907_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.bias key (0.0, 0.03486784401000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.weight key (1.0, 0.012157665459056936, False, False) _get_param_groups name module.module.decoder.layers.2.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.1.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.23.ls1 lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.1.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.bias lr_decay_rate 0.9 name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.bias lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.17.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.weight key (1.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.ls1 key (0.0, 0.09000000000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.weight lr_decay_rate 0.3486784401000001_get_param_groups name module.module.decoder.layers.2.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.weight key (1.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.22.ls1 lr_decay_rate 0.81 _get_param_groups name module.module.decoder.layers.2.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.bias key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.bias key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.ls2 key (0.0, 0.03486784401000001, False, False)name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.bias lr_decay_rate 0.6561name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.bias lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.decoder.layers.1.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.weight key (1.0, 0.03486784401000001, False, False)name module.module.external_feature_model.vit.decoder.layers.23.ls2 lr_decay_rate 0.9_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.bias key (0.0, 0.09000000000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.bias lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.bias lr_decay_rate 0.20589113209464907_get_param_groups name module.module.decoder.layers.18.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.ls1 key (0.0, 0.08100000000000002, False, False)_get_param_groups name module.module.decoder.layers.2.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.2.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.ls2 key (0.0, 0.09000000000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.weight lr_decay_rate 0.9_get_param_groups name module.module.decoder.layers.1.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.bias key (0.0, 0.06561, False, False)name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.weight lr_decay_rate 0.9_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.bias key (0.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.bias lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.bias key (0.0, 0.02058911320946491, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.bias key (0.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.weight lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.decoder.layers.18.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.2.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vision_projection.encoder.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.ls2 lr_decay_rate 0.81_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.weight key (1.0, 0.09000000000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.weight lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.2.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.weight key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.2.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.bias key (0.0, 0.03486784401000001, False, False)name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.weight lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.weight key (0.0, 0.03486784401000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.ls2 key (0.0, 0.08100000000000002, False, False)name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.weight lr_decay_rate 0.15009463529699918name module.module.external_feature_model.vit.decoder.layers.21.ls1 lr_decay_rate 0.7290000000000001name module.module.external_feature_model.vit.decoder.layers.5.ls1 lr_decay_rate 0.13508517176729928_get_param_groups name module.module.decoder.layers.2.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.18.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.weight key (0.0, 0.09000000000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.bias lr_decay_rate 0.9 _get_param_groups name module.module.external_feature_model.vision_projection.encoder.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.2.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.bias lr_decay_rate 0.9 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.weight key (1.0, 0.02058911320946491, False, False)name module.module.external_feature_model.vit.decoder.layers.15.ls1 lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.decoder.layers.2.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.weight lr_decay_rate 0.81_get_param_groups name module.module.decoder.layers.2.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.bias lr_decay_rate 0.3486784401000001_get_param_groups name module.module.decoder.layers.18.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.weight key (1.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.bias lr_decay_rate 0.9_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.ls1 key (0.0, 0.0729, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.ls1 key (0.0, 0.013508517176729929, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.bias key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.bias key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.3.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.pre_proj_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.bias lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.ls1 key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.decoder.layers.2.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.bias key (0.0, 0.09000000000000001, False, False)_get_param_groups name module.module.decoder.layers.2.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.weight key (0.0, 0.08100000000000002, False, False)_get_param_groups name module.module.decoder.layers.18.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.21.ls2 lr_decay_rate 0.7290000000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.bias key (0.0, 0.03486784401000001, False, False)name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.bias lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.5.ls2 lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.bias key (0.0, 0.02058911320946491, False, False)name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.weight lr_decay_rate 0.9 _get_param_groups name module.module.external_feature_model.pre_proj_layernorm.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.weight lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.2.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.15.ls2 lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.decoder.layers.3.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.ls2 key (0.0, 0.0729, False, False)_get_param_groups name module.module.decoder.layers.18.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.bias lr_decay_rate 0.81 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.bias key (0.0, 0.015009463529699918, False, False) _get_param_groups name module.module.decoder.layers.2.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.ls2 key (0.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.weight lr_decay_rate 0.9 name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.weight lr_decay_rate 0.3486784401000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.bias key (0.0, 0.08100000000000002, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.weight key (1.0, 0.09000000000000001, False, False) _get_param_groups name module.module.embedding.word_embeddings.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.10.ls1 lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.weight key (1.0, 0.09000000000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.ls2 key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.decoder.layers.3.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.2.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.3.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.18.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.weight key (1.0, 0.09000000000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.weight lr_decay_rate 0.7290000000000001name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.weight lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.weight key (1.0, 0.03486784401000001, False, False)name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.bias lr_decay_rate 0.9 name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.weight lr_decay_rate 0.15009463529699918_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.ls1 key (0.0, 0.02287679245496101, False, False)name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.weight lr_decay_rate 0.81 name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.weight lr_decay_rate 0.3874204890000001_get_param_groups name module.module.decoder.layers.3.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.19.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.bias lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.2.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.weight key (0.0, 0.0729, False, False) _get_param_groups name module.module.decoder.layers.0.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.weight key (0.0, 0.013508517176729929, False, False) _get_param_groups name module.module.decoder.layers.3.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.bias lr_decay_rate 0.9_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.weight key (0.0, 0.015009463529699918, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.bias key (0.0, 0.09000000000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.bias lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.10.ls2 lr_decay_rate 0.2287679245496101_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.weight key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.weight key (1.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.2.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.bias key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.3.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.19.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.bias lr_decay_rate 0.7290000000000001 name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.bias lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.bias key (0.0, 0.09000000000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.ls2 key (0.0, 0.02287679245496101, False, False)_get_param_groups name module.module.decoder.layers.3.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.0.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.bias lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.bias key (0.0, 0.03486784401000001, False, False) _get_param_groups name module.module.external_feature_model.vision_projection.encoder.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.19.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.3.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.bias lr_decay_rate 0.3874204890000001name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.bias lr_decay_rate 0.81 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.bias key (0.0, 0.0729, False, False)_get_param_groups name module.module.decoder.layers.3.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.weight lr_decay_rate 0.9 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.bias key (0.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.bias key (0.0, 0.013508517176729929, False, False) _get_param_groups name module.module.decoder.layers.0.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.weight lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.3.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.weight lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.external_feature_model.vision_projection.encoder.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.weight lr_decay_rate 0.3486784401000001_get_param_groups name module.module.decoder.layers.3.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.19.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.bias key (0.0, 0.03874204890000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.bias key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.weight key (1.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.0.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.3.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.weight key (0.0, 0.02287679245496101, False, False)name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.weight lr_decay_rate 0.7290000000000001name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.weight lr_decay_rate 0.15009463529699918_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.weight key (1.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.3.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.weight lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.weight key (1.0, 0.03486784401000001, False, False) name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.weight lr_decay_rate 0.3874204890000001_get_param_groups name module.module.external_feature_model.pre_proj_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.4.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.bias lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.0.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.3.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.weight lr_decay_rate 0.81 name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.bias lr_decay_rate 0.9_get_param_groups name module.module.decoder.layers.19.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.bias lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.weight key (1.0, 0.013508517176729929, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.weight key (1.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.weight key (1.0, 0.0729, False, False)_get_param_groups name module.module.decoder.layers.3.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.bias key (0.0, 0.09000000000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.bias lr_decay_rate 0.3486784401000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.bias key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.weight key (1.0, 0.03874204890000001, False, False) _get_param_groups name module.module.decoder.layers.4.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.bias lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.pre_proj_layernorm.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.bias key (0.0, 0.02287679245496101, False, False)_get_param_groups name module.module.decoder.layers.19.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.weight key (1.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.0.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.3.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.bias key (0.0, 0.03486784401000001, False, False) _get_param_groups name module.module.decoder.layers.3.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.bias lr_decay_rate 0.7290000000000001name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.bias lr_decay_rate 0.13508517176729928name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.bias lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vision_projection.encoder.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.bias key (0.0, 0.015009463529699918, False, False)name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.weight lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.4.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.19.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.0.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.bias lr_decay_rate 0.81 _get_param_groups name module.module.decoder.layers.3.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.weight lr_decay_rate 0.2287679245496101name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.weight lr_decay_rate 0.3486784401000001_get_param_groups name module.module.embedding.word_embeddings.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.weight lr_decay_rate 0.15009463529699918_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.bias key (0.0, 0.0729, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.bias key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.decoder.layers.4.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.bias key (0.0, 0.013508517176729929, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.weight key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.4.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vision_projection.encoder.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.20.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.weight key (1.0, 0.02287679245496101, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.bias key (0.0, 0.08100000000000002, False, False)_get_param_groups name module.module.decoder.layers.1.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.weight lr_decay_rate 0.7290000000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.weight key (0.0, 0.03486784401000001, False, False)_get_param_groups name module.module.decoder.layers.3.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.bias lr_decay_rate 0.9 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.weight key (1.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.weight lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.decoder.layers.0.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.4.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.4.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.pre_proj_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.weight lr_decay_rate 0.13508517176729928_get_param_groups name module.module.decoder.layers.20.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.bias key (0.0, 0.09000000000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.bias lr_decay_rate 0.2287679245496101 name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.bias lr_decay_rate 0.15009463529699918name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.bias lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.weight key (1.0, 0.0729, False, False)_get_param_groups name module.module.decoder.layers.3.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.1.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.weight lr_decay_rate 0.81_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.weight key (1.0, 0.03874204890000001, False, False) _get_param_groups name module.module.decoder.layers.4.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.0.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.pre_proj_layernorm.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.4.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.weight key (1.0, 0.013508517176729929, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.bias key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.decoder.layers.20.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.bias key (0.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.weight lr_decay_rate 0.9name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.bias lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.bias key (0.0, 0.03486784401000001, False, False) _get_param_groups name module.module.decoder.layers.1.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.weight key (0.0, 0.08100000000000002, False, False)_get_param_groups name module.module.decoder.layers.4.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.bias lr_decay_rate 0.3874204890000001_get_param_groups name module.module.decoder.layers.4.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.4.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.embedding.word_embeddings.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.0.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.bias key (0.0, 0.0729, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.weight key (1.0, 0.09000000000000001, False, False)_get_param_groups name module.module.decoder.layers.20.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.bias lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.weight lr_decay_rate 0.2287679245496101 name module.module.external_feature_model.vit.decoder.layers.7.ls1 lr_decay_rate 0.16677181699666577_get_param_groups name module.module.decoder.layers.1.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.bias key (0.0, 0.03874204890000001, False, False)name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.weight lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.decoder.layers.5.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.bias lr_decay_rate 0.81 _get_param_groups name module.module.decoder.layers.4.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.4.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.0.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.0.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.bias lr_decay_rate 0.9_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.bias key (0.0, 0.013508517176729929, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.ls1 key (0.0, 0.016677181699666577, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.weight key (1.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.weight key (1.0, 0.03486784401000001, False, False)_get_param_groups name module.module.decoder.layers.20.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.weight lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.decoder.layers.1.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.5.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.weight lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.bias key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.4.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.4.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.bias key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.0.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.7.ls2 lr_decay_rate 0.16677181699666577_get_param_groups name module.module.decoder.layers.0.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.bias lr_decay_rate 0.2287679245496101name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.bias lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.weight key (0.0, 0.0729, False, False)_get_param_groups name module.module.decoder.layers.20.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.weight lr_decay_rate 0.13508517176729928_get_param_groups name module.module.decoder.layers.5.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.1.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.4.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.weight key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.decoder.layers.4.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.weight lr_decay_rate 0.9_get_param_groups name module.module.decoder.layers.0.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.weight lr_decay_rate 0.81_get_param_groups name module.module.decoder.layers.0.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.ls2 key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.decoder.layers.20.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.bias key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.bias key (0.0, 0.03486784401000001, False, False)_get_param_groups name module.module.decoder.layers.5.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.bias lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.weight key (1.0, 0.08100000000000002, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.weight key (0.0, 0.013508517176729929, False, False)_get_param_groups name module.module.decoder.layers.0.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.1.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.weight key (1.0, 0.09000000000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.bias lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.decoder.layers.5.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.4.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.21.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.0.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.weight lr_decay_rate 0.2287679245496101name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.weight lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.weight lr_decay_rate 0.3486784401000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.bias key (0.0, 0.0729, False, False) name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.bias lr_decay_rate 0.13508517176729928_get_param_groups name module.module.decoder.layers.5.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.bias lr_decay_rate 0.81_get_param_groups name module.module.decoder.layers.2.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.0.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.bias lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.4.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.bias key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.weight key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.decoder.layers.5.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.1.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.21.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.weight key (0.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.weight lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.weight key (1.0, 0.03486784401000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.bias key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.bias key (0.0, 0.013508517176729929, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.bias key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.5.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.5.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.weight lr_decay_rate 0.3874204890000001_get_param_groups name module.module.decoder.layers.4.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.0.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.2.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.bias lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.decoder.layers.21.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.bias lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.decoder.layers.1.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.weight key (1.0, 0.0729, False, False)name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.bias lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.external_feature_model.vision_projection.encoder.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.weight key (1.0, 0.03874204890000001, False, False) _get_param_groups name module.module.decoder.layers.5.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.0.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.5.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.weight lr_decay_rate 0.13508517176729928 name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.weight lr_decay_rate 0.81_get_param_groups name module.module.decoder.layers.5.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.bias key (0.0, 0.016677181699666577, False, False)_get_param_groups name module.module.decoder.layers.2.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.bias key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.decoder.layers.21.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.1.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.bias key (0.0, 0.03486784401000001, False, False)_get_param_groups name module.module.external_feature_model.vision_projection.encoder.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.bias lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.decoder.layers.1.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.5.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.bias lr_decay_rate 0.3874204890000001_get_param_groups name module.module.decoder.layers.5.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.weight key (1.0, 0.013508517176729929, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.weight key (1.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.2.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.6.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.weight lr_decay_rate 0.2287679245496101 name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.weight lr_decay_rate 0.16677181699666577_get_param_groups name module.module.decoder.layers.1.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.bias key (0.0, 0.0729, False, False) _get_param_groups name module.module.external_feature_model.pre_proj_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.bias key (0.0, 0.03874204890000001, False, False)_get_param_groups name module.module.decoder.layers.21.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.5.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.15.ls1 lr_decay_rate 0.3874204890000001 name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.bias lr_decay_rate 0.81 _get_param_groups name module.module.decoder.layers.5.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.bias lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.weight key (1.0, 0.02287679245496101, False, False)_get_param_groups name module.module.decoder.layers.2.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.1.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.weight key (1.0, 0.016677181699666577, False, False) _get_param_groups name module.module.decoder.layers.6.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.1.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.5.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.pre_proj_layernorm.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.21.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.weight lr_decay_rate 0.7290000000000001name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.weight lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.decoder.layers.5.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.ls1 key (0.0, 0.03874204890000001, False, False)_get_param_groups name module.module.decoder.layers.2.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.bias key (0.0, 0.08100000000000002, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.bias key (0.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.bias lr_decay_rate 0.2287679245496101_get_param_groups name module.module.decoder.layers.1.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.6.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.1.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.bias lr_decay_rate 0.16677181699666577_get_param_groups name module.module.decoder.layers.21.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.embedding.word_embeddings.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.6.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.weight key (1.0, 0.0729, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.weight key (1.0, 0.03874204890000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.bias key (0.0, 0.02287679245496101, False, False) name module.module.external_feature_model.vit.decoder.layers.23.ls1 lr_decay_rate 0.9_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.bias key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.decoder.layers.5.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.15.ls2 lr_decay_rate 0.3874204890000001_get_param_groups name module.module.decoder.layers.2.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.1.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.6.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.weight lr_decay_rate 0.13508517176729928_get_param_groups name module.module.decoder.layers.22.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.1.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.6.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.0.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.weight lr_decay_rate 0.2287679245496101name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.bias lr_decay_rate 0.7290000000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.ls1 key (0.0, 0.09000000000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.bias lr_decay_rate 0.3874204890000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.ls2 key (0.0, 0.03874204890000001, False, False) name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.weight lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.decoder.layers.5.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.3.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.6.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.weight key (1.0, 0.013508517176729929, False, False)_get_param_groups name module.module.decoder.layers.22.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.6.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.1.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.bias key (0.0, 0.0729, False, False) name module.module.external_feature_model.vit.decoder.layers.23.ls2 lr_decay_rate 0.9_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.weight key (1.0, 0.02287679245496101, False, False) name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.weight lr_decay_rate 0.3874204890000001_get_param_groups name module.module.decoder.layers.2.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.bias key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.weight key (1.0, 0.016677181699666577, False, False)_get_param_groups name module.module.decoder.layers.0.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.bias lr_decay_rate 0.13508517176729928_get_param_groups name module.module.decoder.layers.6.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.22.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.5.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.6.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.ls2 key (0.0, 0.09000000000000001, False, False)_get_param_groups name module.module.decoder.layers.3.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.weight key (0.0, 0.03874204890000001, False, False)_get_param_groups name module.module.decoder.layers.1.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.2.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.22.ls1 lr_decay_rate 0.81 name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.bias lr_decay_rate 0.2287679245496101 name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.bias lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.16.ls1 lr_decay_rate 0.4304672100000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.bias key (0.0, 0.013508517176729929, False, False)_get_param_groups name module.module.decoder.layers.6.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.0.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.22.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.6.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.weight lr_decay_rate 0.9 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.ls1 key (0.0, 0.08100000000000002, False, False)_get_param_groups name module.module.decoder.layers.6.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.3.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.bias key (0.0, 0.02287679245496101, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.ls1 key (0.0, 0.04304672100000001, False, False) name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.bias lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.decoder.layers.1.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.2.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.bias key (0.0, 0.016677181699666577, False, False)_get_param_groups name module.module.decoder.layers.0.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.weight key (0.0, 0.09000000000000001, False, False)_get_param_groups name module.module.decoder.layers.22.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.6.ls1 lr_decay_rate 0.15009463529699918_get_param_groups name module.module.decoder.layers.6.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.6.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.22.ls2 lr_decay_rate 0.81 _get_param_groups name module.module.decoder.layers.7.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.2.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.16.ls2 lr_decay_rate 0.4304672100000001 name module.module.external_feature_model.vit.decoder.layers.11.ls1 lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.bias key (0.0, 0.03874204890000001, False, False)_get_param_groups name module.module.decoder.layers.3.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.2.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.bias lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.0.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.weight lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.decoder.layers.22.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.ls1 key (0.0, 0.015009463529699918, False, False)_get_param_groups name module.module.decoder.layers.6.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.ls2 key (0.0, 0.08100000000000002, False, False)_get_param_groups name module.module.decoder.layers.6.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.7.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.ls2 key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.bias key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.ls1 key (0.0, 0.02541865828329001, False, False)_get_param_groups name module.module.decoder.layers.2.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.0.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.weight key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.decoder.layers.3.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.22.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.weight lr_decay_rate 0.3874204890000001_get_param_groups name module.module.decoder.layers.2.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.6.ls2 lr_decay_rate 0.15009463529699918_get_param_groups name module.module.decoder.layers.7.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.7.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.6.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.weight lr_decay_rate 0.81 name module.module.external_feature_model.vit.decoder.layers.11.ls2 lr_decay_rate 0.2541865828329001 name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.weight lr_decay_rate 0.4304672100000001 name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.bias lr_decay_rate 0.16677181699666577_get_param_groups name module.module.decoder.layers.2.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.weight lr_decay_rate 0.9_get_param_groups name module.module.decoder.layers.0.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.3.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.23.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.7.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.weight key (1.0, 0.03874204890000001, False, False) _get_param_groups name module.module.decoder.layers.7.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.2.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.ls2 key (0.0, 0.015009463529699918, False, False) _get_param_groups name module.module.decoder.layers.6.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.ls2 key (0.0, 0.02541865828329001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.weight key (0.0, 0.08100000000000002, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.weight key (1.0, 0.09000000000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.weight key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.decoder.layers.2.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.bias key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.decoder.layers.3.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.1.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.23.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.7.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.7.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.bias lr_decay_rate 0.3874204890000001 name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.bias lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.6.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.weight lr_decay_rate 0.15009463529699918_get_param_groups name module.module.decoder.layers.2.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.7.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.weight lr_decay_rate 0.2541865828329001name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.bias lr_decay_rate 0.81 _get_param_groups name module.module.decoder.layers.4.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.bias lr_decay_rate 0.4304672100000001_get_param_groups name module.module.decoder.layers.2.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.1.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.weight lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.decoder.layers.7.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.23.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.bias key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.bias key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.6.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.2.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.3.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.bias key (0.0, 0.08100000000000002, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.weight key (0.0, 0.015009463529699918, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.bias key (0.0, 0.04304672100000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.weight key (0.0, 0.02541865828329001, False, False)_get_param_groups name module.module.decoder.layers.7.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.4.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.weight key (1.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.weight lr_decay_rate 0.9_get_param_groups name module.module.decoder.layers.23.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.1.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.7.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.7.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.weight lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.decoder.layers.2.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.bias lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.decoder.layers.8.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.4.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.3.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.weight lr_decay_rate 0.81_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.weight key (1.0, 0.09000000000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.bias lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.decoder.layers.1.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.7.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.bias key (0.0, 0.015009463529699918, False, False) name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.bias lr_decay_rate 0.16677181699666577_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.weight key (1.0, 0.03874204890000001, False, False) _get_param_groups name module.module.decoder.layers.4.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.7.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.weight lr_decay_rate 0.4304672100000001_get_param_groups name module.module.decoder.layers.3.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.23.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.3.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.bias lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.8.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.weight key (1.0, 0.08100000000000002, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.bias key (0.0, 0.02541865828329001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.weight key (1.0, 0.04304672100000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.bias key (0.0, 0.016677181699666577, False, False)_get_param_groups name module.module.decoder.layers.7.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.1.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.3.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.7.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.bias key (0.0, 0.09000000000000001, False, False)_get_param_groups name module.module.decoder.layers.4.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.3.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.bias lr_decay_rate 0.3874204890000001_get_param_groups name module.module.decoder.layers.8.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.23.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.weight lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.bias lr_decay_rate 0.81 _get_param_groups name module.module.decoder.layers.7.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.bias lr_decay_rate 0.4304672100000001 name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.weight lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.weight lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.decoder.layers.3.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.3.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.8.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.1.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.4.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.bias key (0.0, 0.03874204890000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.weight key (1.0, 0.015009463529699918, False, False)_get_param_groups name module.module.decoder.layers.8.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.bias key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.weight key (1.0, 0.016677181699666577, False, False) _get_param_groups name module.module.decoder.layers.23.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.weight key (1.0, 0.02541865828329001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.bias key (0.0, 0.08100000000000002, False, False) name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.weight lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.3.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.7.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.3.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.4.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.1.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.8.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.bias lr_decay_rate 0.2541865828329001 name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.weight lr_decay_rate 0.3874204890000001_get_param_groups name module.module.decoder.layers.8.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.bias lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.weight lr_decay_rate 0.81name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.bias lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.weight lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.decoder.layers.24.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.weight key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.5.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.2.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.7.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.3.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.3.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.weight key (1.0, 0.08100000000000002, False, False)_get_param_groups name module.module.decoder.layers.8.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.weight key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.bias key (0.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.bias key (0.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.bias key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.decoder.layers.8.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.weight key (1.0, 0.04304672100000001, False, False) _get_param_groups name module.module.decoder.layers.24.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.bias lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.5.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.bias lr_decay_rate 0.81_get_param_groups name module.module.decoder.layers.7.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.8.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.4.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.8.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.bias lr_decay_rate 0.3874204890000001_get_param_groups name module.module.decoder.layers.3.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.8.ls1 lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.weight lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.decoder.layers.2.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.bias key (0.0, 0.09000000000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.weight lr_decay_rate 0.2541865828329001name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.bias lr_decay_rate 0.4304672100000001_get_param_groups name module.module.decoder.layers.24.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.8.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.bias key (0.0, 0.08100000000000002, False, False)_get_param_groups name module.module.decoder.layers.5.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.weight key (1.0, 0.015009463529699918, False, False)_get_param_groups name module.module.decoder.layers.9.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.4.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.bias key (0.0, 0.03874204890000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.ls1 key (0.0, 0.018530201888518418, False, False) _get_param_groups name module.module.decoder.layers.3.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.24.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.2.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.8.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.bias key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.weight key (1.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.weight lr_decay_rate 0.9_get_param_groups name module.module.decoder.layers.8.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.bias lr_decay_rate 0.15009463529699918 name module.module.external_feature_model.vit.decoder.layers.8.ls2 lr_decay_rate 0.18530201888518416_get_param_groups name module.module.decoder.layers.5.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.weight lr_decay_rate 0.81_get_param_groups name module.module.decoder.layers.4.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.4.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.weight lr_decay_rate 0.3874204890000001_get_param_groups name module.module.decoder.layers.2.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.9.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.bias lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.decoder.layers.8.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.24.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.8.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.ls2 key (0.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.weight key (1.0, 0.09000000000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.bias key (0.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.weight key (0.0, 0.08100000000000002, False, False)name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.weight lr_decay_rate 0.4304672100000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.weight key (1.0, 0.03874204890000001, False, False) _get_param_groups name module.module.decoder.layers.4.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.bias key (0.0, 0.02541865828329001, False, False) _get_param_groups name module.module.decoder.layers.5.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.4.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.8.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.8.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.24.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.9.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.2.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.weight lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.bias lr_decay_rate 0.81 name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.bias lr_decay_rate 0.9name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.weight lr_decay_rate 0.15009463529699918name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.bias lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.weight key (0.0, 0.04304672100000001, False, False) _get_param_groups name module.module.decoder.layers.9.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.5.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.24.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.4.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.4.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.weight lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.decoder.layers.8.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.9.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.weight key (0.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.weight key (0.0, 0.015009463529699918, False, False) _get_param_groups name module.module.decoder.layers.2.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.bias key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.bias key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.bias key (0.0, 0.03874204890000001, False, False)_get_param_groups name module.module.decoder.layers.9.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.bias lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.decoder.layers.25.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.4.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.5.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.bias lr_decay_rate 0.18530201888518416_get_param_groups name module.module.decoder.layers.4.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.8.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.weight key (0.0, 0.02541865828329001, False, False) _get_param_groups name module.module.decoder.layers.2.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.bias lr_decay_rate 0.15009463529699918name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.weight lr_decay_rate 0.9_get_param_groups name module.module.decoder.layers.9.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.weight lr_decay_rate 0.81 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.bias key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.decoder.layers.6.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.4.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.9.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.4.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.8.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.weight lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.bias key (0.0, 0.018530201888518418, False, False)_get_param_groups name module.module.decoder.layers.25.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.bias lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.bias key (0.0, 0.015009463529699918, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.weight key (1.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.3.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.weight key (1.0, 0.09000000000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.weight key (1.0, 0.03874204890000001, False, False)_get_param_groups name module.module.decoder.layers.9.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.9.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.9.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.4.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.5.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.weight lr_decay_rate 0.4304672100000001_get_param_groups name module.module.decoder.layers.25.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.weight lr_decay_rate 0.15009463529699918_get_param_groups name module.module.decoder.layers.6.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.bias lr_decay_rate 0.81 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.bias key (0.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.weight lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.bias lr_decay_rate 0.9 name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.bias lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.decoder.layers.9.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.3.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.9.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.4.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.weight key (1.0, 0.015009463529699918, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.weight key (1.0, 0.04304672100000001, False, False) _get_param_groups name module.module.decoder.layers.25.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.9.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.bias key (0.0, 0.08100000000000002, False, False)_get_param_groups name module.module.decoder.layers.6.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.weight lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.decoder.layers.5.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.weight key (1.0, 0.018530201888518418, False, False) _get_param_groups name module.module.decoder.layers.9.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.bias key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.bias key (0.0, 0.09000000000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.bias lr_decay_rate 0.15009463529699918_get_param_groups name module.module.decoder.layers.3.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.5.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.10.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.weight key (1.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.bias lr_decay_rate 0.4304672100000001_get_param_groups name module.module.decoder.layers.6.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.weight lr_decay_rate 0.81 _get_param_groups name module.module.decoder.layers.9.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.9.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.25.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.5.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.16.ls1 lr_decay_rate 0.4304672100000001name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.bias lr_decay_rate 0.18530201888518416_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.bias key (0.0, 0.015009463529699918, False, False)_get_param_groups name module.module.decoder.layers.5.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.3.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.bias lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.decoder.layers.9.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.bias key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.decoder.layers.10.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.6.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vision_projection.encoder.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.weight key (1.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.10.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.5.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.ls1 key (0.0, 0.04304672100000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.bias key (0.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.bias key (0.0, 0.018530201888518418, False, False)_get_param_groups name module.module.decoder.layers.25.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.3.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.5.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.weight lr_decay_rate 0.15009463529699918_get_param_groups name module.module.decoder.layers.9.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.10.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vision_projection.encoder.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.6.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.weight lr_decay_rate 0.4304672100000001 name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.bias lr_decay_rate 0.81_get_param_groups name module.module.decoder.layers.10.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.weight lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.decoder.layers.5.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.16.ls2 lr_decay_rate 0.4304672100000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.weight key (1.0, 0.015009463529699918, False, False)_get_param_groups name module.module.decoder.layers.5.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.25.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.weight lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.weight key (1.0, 0.04304672100000001, False, False) _get_param_groups name module.module.decoder.layers.3.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.10.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.bias key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.9.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.pre_proj_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.6.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.bias lr_decay_rate 0.15009463529699918_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.weight key (1.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.ls2 key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.decoder.layers.10.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.26.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.weight key (1.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.bias lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.decoder.layers.3.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.5.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.9.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.10.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.5.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.pre_proj_layernorm.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.7.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.ls1 lr_decay_rate 0.9 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.bias key (0.0, 0.015009463529699918, False, False) _get_param_groups name module.module.decoder.layers.10.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.bias lr_decay_rate 0.18530201888518416_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.bias key (0.0, 0.04304672100000001, False, False) name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.weight lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.decoder.layers.4.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.26.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.bias lr_decay_rate 0.2541865828329001_get_param_groups name module.module.decoder.layers.5.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.10.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.5.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.10.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.7.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.embedding.word_embeddings.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.ls1 key (0.0, 0.09000000000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.7.ls1 lr_decay_rate 0.16677181699666577_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.bias key (0.0, 0.018530201888518418, False, False) _get_param_groups name module.module.decoder.layers.10.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.17.ls1 lr_decay_rate 0.4782969000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.weight key (0.0, 0.04304672100000001, False, False) _get_param_groups name module.module.decoder.layers.4.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.26.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.5.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.bias key (0.0, 0.02541865828329001, False, False)_get_param_groups name module.module.decoder.layers.10.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.10.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.6.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.7.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.ls2 lr_decay_rate 0.9_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.ls1 key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.ls1 key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.decoder.layers.10.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.0.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.bias lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.decoder.layers.4.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.26.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.6.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.weight lr_decay_rate 0.18530201888518416name module.module.external_feature_model.vit.decoder.layers.12.ls1 lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.decoder.layers.10.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.7.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.11.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.7.ls2 lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.decoder.layers.6.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.ls2 key (0.0, 0.09000000000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.17.ls2 lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.bias key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.decoder.layers.10.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.ls1 key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.decoder.layers.4.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.0.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.10.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.weight key (0.0, 0.018530201888518418, False, False) _get_param_groups name module.module.decoder.layers.6.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.26.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.ls2 key (0.0, 0.016677181699666577, False, False)_get_param_groups name module.module.decoder.layers.11.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.6.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.weight lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.10.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.0.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.ls2 key (0.0, 0.04782969000000001, False, False)_get_param_groups name module.module.decoder.layers.7.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.11.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.12.ls2 lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.decoder.layers.4.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.6.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.bias lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.weight lr_decay_rate 0.4304672100000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.weight key (0.0, 0.09000000000000001, False, False)_get_param_groups name module.module.decoder.layers.26.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.6.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.11.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.weight lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.ls2 key (0.0, 0.028242953648100012, False, False) name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.weight lr_decay_rate 0.4782969000000001_get_param_groups name module.module.decoder.layers.6.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.10.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.4.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.0.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.7.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.11.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.bias key (0.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.bias lr_decay_rate 0.9_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.weight key (1.0, 0.04304672100000001, False, False)_get_param_groups name module.module.decoder.layers.26.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.weight lr_decay_rate 0.2824295364810001_get_param_groups name module.module.decoder.layers.11.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.6.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.4.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.weight key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.decoder.layers.7.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.weight key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.decoder.layers.10.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.11.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.6.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.weight lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.decoder.layers.0.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.bias key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.weight key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.decoder.layers.27.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.bias lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.decoder.layers.6.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.class_token lr_decay_rate 1.0 name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.bias lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.decoder.layers.11.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.11.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.11.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.5.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.8.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.bias lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.weight key (1.0, 0.018530201888518418, False, False)_get_param_groups name module.module.decoder.layers.6.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.0.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.6.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.bias lr_decay_rate 0.2824295364810001_get_param_groups name module.module.decoder.layers.27.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.bias key (0.0, 0.04304672100000001, False, False) name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.weight lr_decay_rate 0.9 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.bias key (0.0, 0.016677181699666577, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.bias key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.decoder.layers.11.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.6.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.bias lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.decoder.layers.11.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.0.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.bias key (0.0, 0.028242953648100012, False, False)_get_param_groups name module.module.decoder.layers.11.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.5.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.7.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.8.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.27.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.bias key (0.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.weight lr_decay_rate 0.4304672100000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.weight key (1.0, 0.09000000000000001, False, False)_get_param_groups name module.module.decoder.layers.11.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.11.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.11.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.1.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.7.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.weight lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.weight lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.decoder.layers.5.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.27.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.8.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.7.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.12.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.weight lr_decay_rate 0.2824295364810001 name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.weight lr_decay_rate 0.18530201888518416_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.weight key (1.0, 0.04304672100000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.weight key (1.0, 0.04782969000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.bias lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.11.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.11.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.weight key (1.0, 0.016677181699666577, False, False)_get_param_groups name module.module.decoder.layers.7.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.5.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.1.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.weight key (1.0, 0.028242953648100012, False, False)_get_param_groups name module.module.decoder.layers.8.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.bias lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.decoder.layers.7.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.27.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.12.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.weight key (1.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.bias lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.bias key (0.0, 0.09000000000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.bias lr_decay_rate 0.16677181699666577_get_param_groups name module.module.decoder.layers.12.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.7.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.11.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.1.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.bias key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.decoder.layers.5.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.27.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.bias lr_decay_rate 0.2824295364810001 name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.weight lr_decay_rate 0.9_get_param_groups name module.module.decoder.layers.7.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.12.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.8.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.bias lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.bias key (0.0, 0.04304672100000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.bias key (0.0, 0.016677181699666577, False, False)_get_param_groups name module.module.decoder.layers.7.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.11.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.weight lr_decay_rate 0.4782969000000001_get_param_groups name module.module.decoder.layers.12.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.bias key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.decoder.layers.1.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.27.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.5.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.8.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.12.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.weight key (1.0, 0.09000000000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.bias key (0.0, 0.018530201888518418, False, False) _get_param_groups name module.module.external_feature_model.vit.class_token key (1.0, 0.1, False, False) _get_param_groups name module.module.decoder.layers.7.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.weight lr_decay_rate 0.4304672100000001name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.weight lr_decay_rate 0.16677181699666577_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.weight key (1.0, 0.04782969000000001, False, False) _get_param_groups name module.module.decoder.layers.12.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.1.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.11.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.28.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.7.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.weight lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.decoder.layers.5.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.bias lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.8.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.12.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.9.ls1 lr_decay_rate 0.20589113209464907_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.weight key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.decoder.layers.7.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.1.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.12.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.weight key (1.0, 0.016677181699666577, False, False) _get_param_groups name module.module.decoder.layers.28.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.bias key (0.0, 0.09000000000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.bias lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.weight key (1.0, 0.028242953648100012, False, False)name module.module.external_feature_model.vit.conv1.weight lr_decay_rate 0.0717897987691853_get_param_groups name module.module.decoder.layers.7.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.9.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.6.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.12.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.28.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.12.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.ls1 key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.decoder.layers.1.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.bias lr_decay_rate 0.4304672100000001_get_param_groups name module.module.decoder.layers.7.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.7.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.bias lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.decoder.layers.12.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.bias key (0.0, 0.04782969000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.bias lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.decoder.layers.28.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.weight lr_decay_rate 0.9 _get_param_groups name module.module.external_feature_model.vit.conv1.weight key (1.0, 0.00717897987691853, False, False)_get_param_groups name module.module.decoder.layers.9.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.9.ls2 lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.decoder.layers.6.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.12.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.bias key (0.0, 0.028242953648100012, False, False)_get_param_groups name module.module.decoder.layers.12.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.bias key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.bias key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.decoder.layers.12.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.2.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.8.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.8.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.ls2 key (0.0, 0.02058911320946491, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.weight key (0.0, 0.09000000000000001, False, False)name module.module.external_feature_model.vit.conv1.bias lr_decay_rate 0.0717897987691853_get_param_groups name module.module.decoder.layers.28.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.12.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.9.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.weight lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.weight lr_decay_rate 0.4782969000000001_get_param_groups name module.module.decoder.layers.13.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.12.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.weight lr_decay_rate 0.4304672100000001name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.weight lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.decoder.layers.2.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.6.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.8.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.8.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.weight key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.decoder.layers.9.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.weight lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.decoder.layers.13.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.bias lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.12.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.28.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.weight key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.conv1.bias key (0.0, 0.00717897987691853, False, False)_get_param_groups name module.module.decoder.layers.6.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.13.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.weight key (0.0, 0.028242953648100012, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.weight key (1.0, 0.04304672100000001, False, False) _get_param_groups name module.module.decoder.layers.2.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.8.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.8.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.bias lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.decoder.layers.13.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.9.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.28.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.weight key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.bias key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.6.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.bias lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.decoder.layers.2.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.bias lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.decoder.layers.8.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.12.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.bias lr_decay_rate 0.2824295364810001name module.module.external_feature_model.vit.position_embeddings.weight lr_decay_rate 0.0717897987691853 _get_param_groups name module.module.decoder.layers.8.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.13.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.bias key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.decoder.layers.29.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.bias key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.decoder.layers.13.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.9.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.bias lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.weight lr_decay_rate 0.9_get_param_groups name module.module.decoder.layers.2.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.bias key (0.0, 0.028242953648100012, False, False)_get_param_groups name module.module.decoder.layers.6.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.bias key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.decoder.layers.12.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.8.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.13.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.weight lr_decay_rate 0.4304672100000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.bias key (0.0, 0.02058911320946491, False, False)_get_param_groups name module.module.external_feature_model.vit.position_embeddings.weight key (1.0, 0.00717897987691853, False, False) _get_param_groups name module.module.decoder.layers.9.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.8.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.29.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.weight lr_decay_rate 0.4782969000000001_get_param_groups name module.module.decoder.layers.2.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.6.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.13.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.weight key (1.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.13.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.12.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.weight lr_decay_rate 0.2824295364810001name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.weight lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.decoder.layers.8.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.weight key (1.0, 0.04304672100000001, False, False) name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.weight lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.decoder.layers.13.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.0.ls1 lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.decoder.layers.7.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.10.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.8.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.weight key (1.0, 0.04782969000000001, False, False)_get_param_groups name module.module.decoder.layers.2.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.13.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.bias lr_decay_rate 0.4304672100000001name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.bias lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.8.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.weight key (1.0, 0.028242953648100012, False, False) _get_param_groups name module.module.decoder.layers.13.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.weight key (1.0, 0.016677181699666577, False, False) _get_param_groups name module.module.decoder.layers.13.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.8.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.weight key (1.0, 0.02058911320946491, False, False)_get_param_groups name module.module.decoder.layers.7.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.10.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.bias key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.ls1 key (0.0, 0.007976644307687256, False, False) _get_param_groups name module.module.decoder.layers.29.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.3.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.bias key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.13.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.13.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.bias lr_decay_rate 0.4782969000000001_get_param_groups name module.module.decoder.layers.9.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.bias lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.decoder.layers.9.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.bias lr_decay_rate 0.16677181699666577_get_param_groups name module.module.decoder.layers.7.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.14.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.3.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.10.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.bias lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.17.ls1 lr_decay_rate 0.4782969000000001name module.module.external_feature_model.vit.decoder.layers.0.ls2 lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.decoder.layers.29.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.13.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.13.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.7.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.bias key (0.0, 0.04782969000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.weight lr_decay_rate 0.9_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.bias key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.bias key (0.0, 0.016677181699666577, False, False)_get_param_groups name module.module.decoder.layers.9.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.10.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.ls1 key (0.0, 0.04782969000000001, False, False)_get_param_groups name module.module.decoder.layers.3.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.9.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.bias key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.decoder.layers.29.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.13.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.14.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.ls2 key (0.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.weight lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.decoder.layers.14.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.weight lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.weight key (1.0, 0.09000000000000001, False, False)_get_param_groups name module.module.decoder.layers.7.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.3.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.weight lr_decay_rate 0.2824295364810001 name module.module.external_feature_model.vit.decoder.layers.17.ls2 lr_decay_rate 0.4782969000000001_get_param_groups name module.module.decoder.layers.9.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.9.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.10.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.weight lr_decay_rate 0.20589113209464907_get_param_groups name module.module.decoder.layers.13.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.weight key (1.0, 0.016677181699666577, False, False) _get_param_groups name module.module.decoder.layers.14.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.weight key (1.0, 0.04782969000000001, False, False) _get_param_groups name module.module.decoder.layers.9.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.weight lr_decay_rate 0.07976644307687256_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.ls2 key (0.0, 0.04782969000000001, False, False)_get_param_groups name module.module.decoder.layers.9.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.14.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.weight key (1.0, 0.028242953648100012, False, False)_get_param_groups name module.module.decoder.layers.3.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.bias lr_decay_rate 0.9_get_param_groups name module.module.decoder.layers.7.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.14.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.10.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.30.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.13.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.bias lr_decay_rate 0.4782969000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.weight key (1.0, 0.02058911320946491, False, False) name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.bias lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.bias lr_decay_rate 0.2824295364810001_get_param_groups name module.module.decoder.layers.9.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.weight lr_decay_rate 0.4782969000000001_get_param_groups name module.module.decoder.layers.3.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.weight key (0.0, 0.007976644307687256, False, False)_get_param_groups name module.module.decoder.layers.14.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.bias key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.9.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.7.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.bias key (0.0, 0.04782969000000001, False, False)_get_param_groups name module.module.decoder.layers.30.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.bias key (0.0, 0.016677181699666577, False, False)name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.bias lr_decay_rate 0.20589113209464907_get_param_groups name module.module.decoder.layers.10.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.13.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.14.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.weight key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.decoder.layers.3.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.bias key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.decoder.layers.14.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.8.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.bias lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.decoder.layers.9.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.30.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.8.ls1 lr_decay_rate 0.18530201888518416_get_param_groups name module.module.external_feature_model.vision_projection.encoder.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.bias key (0.0, 0.02058911320946491, False, False)_get_param_groups name module.module.decoder.layers.11.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.9.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.14.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.4.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.input_layernorm.bias key (0.0, 0.007976644307687256, False, False) _get_param_groups name module.module.decoder.layers.8.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.14.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.bias lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.ls1 key (0.0, 0.018530201888518418, False, False)name module.module.external_feature_model.vit.decoder.layers.18.ls1 lr_decay_rate 0.531441_get_param_groups name module.module.decoder.layers.9.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.13.ls1 lr_decay_rate 0.31381059609000006_get_param_groups name module.module.decoder.layers.14.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.30.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.4.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.9.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vision_projection.encoder.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.14.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.11.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.weight lr_decay_rate 0.20589113209464907name module.module.external_feature_model.vit.decoder.layers.8.ls2 lr_decay_rate 0.18530201888518416name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.weight lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.ls1 key (0.0, 0.031381059609000006, False, False)_get_param_groups name module.module.decoder.layers.10.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.14.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.14.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.8.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.bias key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.ls1 key (0.0, 0.05314410000000001, False, False) _get_param_groups name module.module.decoder.layers.4.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.30.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.10.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.weight key (0.0, 0.02058911320946491, False, False)_get_param_groups name module.module.external_feature_model.pre_proj_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.15.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.weight key (1.0, 0.007976644307687256, False, False)_get_param_groups name module.module.decoder.layers.11.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.8.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.13.ls2 lr_decay_rate 0.31381059609000006_get_param_groups name module.module.decoder.layers.14.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.10.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.weight lr_decay_rate 0.4782969000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.ls2 key (0.0, 0.018530201888518418, False, False) _get_param_groups name module.module.decoder.layers.14.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.30.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.bias lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.decoder.layers.10.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.4.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.18.ls2 lr_decay_rate 0.531441 _get_param_groups name module.module.external_feature_model.pre_proj_layernorm.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.11.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.weight key (1.0, 0.04782969000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.ls2 key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.decoder.layers.8.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.bias key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.decoder.layers.14.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.bias lr_decay_rate 0.07976644307687256_get_param_groups name module.module.decoder.layers.10.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.10.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.15.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.weight lr_decay_rate 0.18530201888518416_get_param_groups name module.module.decoder.layers.15.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.weight lr_decay_rate 0.20589113209464907_get_param_groups name module.module.decoder.layers.30.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.ls2 key (0.0, 0.05314410000000001, False, False) _get_param_groups name module.module.embedding.word_embeddings.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_proj.bias key (0.0, 0.007976644307687256, False, False)_get_param_groups name module.module.decoder.layers.4.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.bias lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.decoder.layers.8.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.14.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.weight lr_decay_rate 0.31381059609000006_get_param_groups name module.module.decoder.layers.10.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.11.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.weight key (0.0, 0.018530201888518418, False, False) _get_param_groups name module.module.decoder.layers.10.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.15.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.15.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.31.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.weight key (1.0, 0.02058911320946491, False, False) name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.weight lr_decay_rate 0.531441_get_param_groups name module.module.decoder.layers.4.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.weight lr_decay_rate 0.07976644307687256_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.bias key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.decoder.layers.11.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.bias lr_decay_rate 0.18530201888518416_get_param_groups name module.module.decoder.layers.14.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.8.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.0.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.15.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.weight key (0.0, 0.031381059609000006, False, False)_get_param_groups name module.module.decoder.layers.15.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.bias lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.bias key (0.0, 0.018530201888518418, False, False)_get_param_groups name module.module.decoder.layers.10.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.10.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.weight key (0.0, 0.05314410000000001, False, False)_get_param_groups name module.module.decoder.layers.31.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.4.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.14.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.weight key (1.0, 0.007976644307687256, False, False) name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.weight lr_decay_rate 0.4782969000000001_get_param_groups name module.module.decoder.layers.11.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.9.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.bias lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.decoder.layers.15.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.15.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.10.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.10.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.bias key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.decoder.layers.0.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.bias lr_decay_rate 0.531441_get_param_groups name module.module.decoder.layers.31.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.weight key (1.0, 0.04782969000000001, False, False)_get_param_groups name module.module.decoder.layers.9.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.5.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.weight lr_decay_rate 0.18530201888518416name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.bias lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.decoder.layers.15.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.12.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.10.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.weight lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.decoder.layers.15.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.bias key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.decoder.layers.15.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.31.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.10.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.0.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.9.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.weight key (1.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.bias key (0.0, 0.05314410000000001, False, False) _get_param_groups name module.module.decoder.layers.15.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.bias lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.self_attention.linear_qkv.bias key (0.0, 0.007976644307687256, False, False) _get_param_groups name module.module.decoder.layers.5.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.15.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.weight key (1.0, 0.02058911320946491, False, False)_get_param_groups name module.module.decoder.layers.11.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.12.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.15.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.31.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.9.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.0.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.11.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.weight lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.bias key (0.0, 0.04782969000000001, False, False)_get_param_groups name module.module.decoder.layers.15.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.weight lr_decay_rate 0.531441name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.bias lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.decoder.layers.16.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.weight lr_decay_rate 0.07976644307687256_get_param_groups name module.module.decoder.layers.15.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.12.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.5.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.11.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.bias lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.decoder.layers.31.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.weight key (1.0, 0.031381059609000006, False, False)_get_param_groups name module.module.decoder.layers.9.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.11.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.weight key (1.0, 0.05314410000000001, False, False)_get_param_groups name module.module.decoder.layers.0.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.weight key (0.0, 0.007976644307687256, False, False)_get_param_groups name module.module.decoder.layers.15.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.bias key (0.0, 0.018530201888518418, False, False)_get_param_groups name module.module.decoder.layers.16.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.weight lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.decoder.layers.12.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.5.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.11.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.16.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.9.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.bias key (0.0, 0.02058911320946491, False, False)name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.bias lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.decoder.layers.31.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.11.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.bias lr_decay_rate 0.531441 _get_param_groups name module.module.decoder.layers.15.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.bias lr_decay_rate 0.07976644307687256_get_param_groups name module.module.decoder.layers.0.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.16.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.bias key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.decoder.layers.16.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.weight lr_decay_rate 0.18530201888518416_get_param_groups name module.module.decoder.layers.9.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.weight key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.decoder.layers.11.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.12.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.5.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.10.ls1 lr_decay_rate 0.2287679245496101_get_param_groups name module.module.decoder.layers.32.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.pre_mlp_layernorm.bias key (0.0, 0.007976644307687256, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.bias key (0.0, 0.05314410000000001, False, False)_get_param_groups name module.module.decoder.layers.11.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.16.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.10.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.15.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.weight lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.decoder.layers.0.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.16.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.weight key (1.0, 0.018530201888518418, False, False)_get_param_groups name module.module.decoder.layers.11.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.ls1 key (0.0, 0.02287679245496101, False, False)_get_param_groups name module.module.decoder.layers.12.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.bias lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.decoder.layers.32.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.5.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.10.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.weight lr_decay_rate 0.531441_get_param_groups name module.module.decoder.layers.16.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.weight lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.decoder.layers.15.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.11.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.weight key (1.0, 0.031381059609000006, False, False)_get_param_groups name module.module.decoder.layers.16.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.10.ls2 lr_decay_rate 0.2287679245496101name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.bias lr_decay_rate 0.18530201888518416_get_param_groups name module.module.decoder.layers.12.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.weight key (1.0, 0.007976644307687256, False, False) _get_param_groups name module.module.decoder.layers.5.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.10.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.1.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.11.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.weight key (1.0, 0.05314410000000001, False, False) _get_param_groups name module.module.decoder.layers.16.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.bias key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.decoder.layers.32.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.16.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.bias lr_decay_rate 0.31381059609000006_get_param_groups name module.module.decoder.layers.11.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.16.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.ls2 key (0.0, 0.02287679245496101, False, False) name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.bias lr_decay_rate 0.531441 _get_param_groups name module.module.decoder.layers.6.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.bias key (0.0, 0.018530201888518418, False, False)_get_param_groups name module.module.decoder.layers.16.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.13.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.10.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.bias lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.decoder.layers.11.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.32.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.11.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.1.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.weight lr_decay_rate 0.4782969000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.bias key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.decoder.layers.16.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.weight lr_decay_rate 0.2287679245496101_get_param_groups name module.module.decoder.layers.16.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.bias key (0.0, 0.05314410000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc1.bias key (0.0, 0.007976644307687256, False, False) _get_param_groups name module.module.decoder.layers.16.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.13.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.10.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.6.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.weight key (1.0, 0.04782969000000001, False, False)_get_param_groups name module.module.decoder.layers.12.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.weight lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.decoder.layers.12.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.weight lr_decay_rate 0.31381059609000006_get_param_groups name module.module.decoder.layers.32.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.1.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.17.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.weight key (0.0, 0.02287679245496101, False, False)_get_param_groups name module.module.decoder.layers.16.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.weight lr_decay_rate 0.07976644307687256 _get_param_groups name module.module.decoder.layers.10.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.17.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.13.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.weight lr_decay_rate 0.531441 _get_param_groups name module.module.decoder.layers.6.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.bias lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.decoder.layers.12.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.weight key (0.0, 0.031381059609000006, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.weight key (0.0, 0.018530201888518418, False, False)_get_param_groups name module.module.decoder.layers.32.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.16.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.17.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.1.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.13.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.bias lr_decay_rate 0.2287679245496101_get_param_groups name module.module.decoder.layers.12.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.17.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.6.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.12.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.weight key (1.0, 0.007976644307687256, False, False) _get_param_groups name module.module.decoder.layers.10.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.weight key (0.0, 0.05314410000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.bias key (0.0, 0.04782969000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.bias lr_decay_rate 0.31381059609000006name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.bias lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.decoder.layers.32.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.bias key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.decoder.layers.12.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.1.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.bias lr_decay_rate 0.07976644307687256_get_param_groups name module.module.decoder.layers.16.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.17.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.12.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.17.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.13.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.bias key (0.0, 0.018530201888518418, False, False)name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.weight lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.decoder.layers.11.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.6.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.bias lr_decay_rate 0.531441_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.bias key (0.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.weight lr_decay_rate 0.2287679245496101_get_param_groups name module.module.decoder.layers.33.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.1.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.12.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.0.mlp.linear_fc2.bias key (0.0, 0.007976644307687256, False, False) _get_param_groups name module.module.decoder.layers.16.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.11.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.weight key (1.0, 0.04782969000000001, False, False)_get_param_groups name module.module.decoder.layers.17.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.6.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.17.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.bias key (0.0, 0.05314410000000001, False, False) _get_param_groups name module.module.decoder.layers.12.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.13.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.weight key (1.0, 0.02287679245496101, False, False)_get_param_groups name module.module.decoder.layers.1.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.weight lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.weight lr_decay_rate 0.31381059609000006_get_param_groups name module.module.decoder.layers.33.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.12.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.1.ls1 lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.decoder.layers.6.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.11.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.16.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.bias lr_decay_rate 0.4782969000000001 name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.bias lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.decoder.layers.13.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.17.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.17.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.weight lr_decay_rate 0.531441 _get_param_groups name module.module.decoder.layers.12.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.weight key (1.0, 0.018530201888518418, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.ls1 key (0.0, 0.008862938119652507, False, False) _get_param_groups name module.module.decoder.layers.11.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.weight key (1.0, 0.031381059609000006, False, False)_get_param_groups name module.module.decoder.layers.2.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.33.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.17.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.12.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.bias key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.decoder.layers.7.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.bias key (0.0, 0.02287679245496101, False, False)_get_param_groups name module.module.decoder.layers.17.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.weight key (1.0, 0.05314410000000001, False, False) _get_param_groups name module.module.decoder.layers.17.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.12.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.14.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.1.ls2 lr_decay_rate 0.08862938119652507_get_param_groups name module.module.decoder.layers.33.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.bias lr_decay_rate 0.18530201888518416 name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.bias lr_decay_rate 0.31381059609000006_get_param_groups name module.module.decoder.layers.13.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.7.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.11.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.2.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.bias lr_decay_rate 0.531441_get_param_groups name module.module.decoder.layers.17.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.14.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.17.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.17.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.bias key (0.0, 0.031381059609000006, False, False)name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.weight lr_decay_rate 0.2287679245496101 name module.module.external_feature_model.vit.decoder.layers.18.ls1 lr_decay_rate 0.531441 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.bias key (0.0, 0.018530201888518418, False, False)_get_param_groups name module.module.decoder.layers.12.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.7.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.ls2 key (0.0, 0.008862938119652507, False, False)_get_param_groups name module.module.decoder.layers.13.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.11.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.2.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.bias key (0.0, 0.05314410000000001, False, False) _get_param_groups name module.module.decoder.layers.18.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.33.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.17.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.14.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.18.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.weight key (1.0, 0.02287679245496101, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.ls1 key (0.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.weight lr_decay_rate 0.31381059609000006_get_param_groups name module.module.decoder.layers.7.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.13.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.weight lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.decoder.layers.13.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.2.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.weight lr_decay_rate 0.08862938119652507_get_param_groups name module.module.decoder.layers.11.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.14.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.33.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.weight lr_decay_rate 0.531441 _get_param_groups name module.module.decoder.layers.17.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.18.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.bias lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.weight key (1.0, 0.031381059609000006, False, False) _get_param_groups name module.module.decoder.layers.18.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.7.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.18.ls2 lr_decay_rate 0.531441 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.weight key (0.0, 0.008862938119652507, False, False) _get_param_groups name module.module.decoder.layers.13.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.weight key (1.0, 0.05314410000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.weight key (1.0, 0.018530201888518418, False, False) _get_param_groups name module.module.decoder.layers.13.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.33.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.bias key (0.0, 0.02287679245496101, False, False)_get_param_groups name module.module.decoder.layers.14.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.17.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.12.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.bias lr_decay_rate 0.31381059609000006_get_param_groups name module.module.decoder.layers.2.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.18.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.ls2 key (0.0, 0.05314410000000001, False, False) _get_param_groups name module.module.decoder.layers.18.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.7.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.bias lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.bias lr_decay_rate 0.531441 _get_param_groups name module.module.decoder.layers.13.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.13.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.bias lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.input_layernorm.bias key (0.0, 0.008862938119652507, False, False)_get_param_groups name module.module.decoder.layers.34.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.bias key (0.0, 0.031381059609000006, False, False)_get_param_groups name module.module.decoder.layers.14.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.17.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.18.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.weight lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.decoder.layers.2.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.13.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.12.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.18.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.weight lr_decay_rate 0.531441 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.bias key (0.0, 0.05314410000000001, False, False)_get_param_groups name module.module.decoder.layers.7.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.13.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.bias key (0.0, 0.018530201888518418, False, False) _get_param_groups name module.module.decoder.layers.17.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.weight lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.decoder.layers.14.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.18.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.34.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.14.ls1 lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.weight key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.decoder.layers.2.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.19.ls1 lr_decay_rate 0.5904900000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.weight key (0.0, 0.05314410000000001, False, False) _get_param_groups name module.module.decoder.layers.12.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.13.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.13.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.9.ls1 lr_decay_rate 0.20589113209464907_get_param_groups name module.module.decoder.layers.18.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.bias lr_decay_rate 0.2287679245496101_get_param_groups name module.module.decoder.layers.15.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.18.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.8.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.ls1 key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.weight key (1.0, 0.008862938119652507, False, False)_get_param_groups name module.module.decoder.layers.34.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.ls1 key (0.0, 0.03486784401000001, False, False)_get_param_groups name module.module.decoder.layers.18.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.3.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.12.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.bias lr_decay_rate 0.531441 _get_param_groups name module.module.decoder.layers.34.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.13.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.bias key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.decoder.layers.14.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.18.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.ls1 key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.decoder.layers.15.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.19.ls2 lr_decay_rate 0.5904900000000001_get_param_groups name module.module.decoder.layers.18.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.8.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.bias lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.decoder.layers.18.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.14.ls2 lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.bias key (0.0, 0.05314410000000001, False, False)_get_param_groups name module.module.decoder.layers.13.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.12.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.18.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.3.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.34.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.ls2 key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.decoder.layers.14.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.9.ls2 lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.weight lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.decoder.layers.15.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_proj.bias key (0.0, 0.008862938119652507, False, False) _get_param_groups name module.module.decoder.layers.8.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.18.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.ls2 key (0.0, 0.03486784401000001, False, False)_get_param_groups name module.module.decoder.layers.19.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.12.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.14.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.weight lr_decay_rate 0.531441_get_param_groups name module.module.decoder.layers.19.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.weight key (1.0, 0.02287679245496101, False, False) _get_param_groups name module.module.decoder.layers.3.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.34.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.14.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.weight lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.ls2 key (0.0, 0.02058911320946491, False, False)_get_param_groups name module.module.decoder.layers.15.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.weight key (1.0, 0.05314410000000001, False, False)_get_param_groups name module.module.decoder.layers.19.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.bias lr_decay_rate 0.2287679245496101_get_param_groups name module.module.decoder.layers.12.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.8.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.18.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.3.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.weight lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.weight lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.decoder.layers.14.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.19.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.weight lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.decoder.layers.15.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.14.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.weight key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.decoder.layers.34.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.bias lr_decay_rate 0.531441 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.bias key (0.0, 0.02287679245496101, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.weight key (0.0, 0.02058911320946491, False, False)_get_param_groups name module.module.decoder.layers.19.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.8.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.weight key (1.0, 0.008862938119652507, False, False)_get_param_groups name module.module.decoder.layers.13.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.weight key (0.0, 0.03486784401000001, False, False) _get_param_groups name module.module.decoder.layers.18.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.14.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.3.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.19.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.bias key (0.0, 0.05314410000000001, False, False)_get_param_groups name module.module.decoder.layers.15.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.14.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.bias lr_decay_rate 0.5904900000000001_get_param_groups name module.module.decoder.layers.35.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.bias lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.weight lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.decoder.layers.8.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.bias lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.decoder.layers.18.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.19.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.13.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.bias lr_decay_rate 0.20589113209464907_get_param_groups name module.module.decoder.layers.14.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.self_attention.linear_qkv.bias key (0.0, 0.008862938119652507, False, False) _get_param_groups name module.module.decoder.layers.8.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.bias key (0.0, 0.05904900000000001, False, False)_get_param_groups name module.module.decoder.layers.15.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.19.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.3.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.35.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.weight key (1.0, 0.02287679245496101, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.bias key (0.0, 0.03486784401000001, False, False) _get_param_groups name module.module.decoder.layers.18.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.14.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.weight lr_decay_rate 0.531441 _get_param_groups name module.module.decoder.layers.13.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.bias key (0.0, 0.02058911320946491, False, False)_get_param_groups name module.module.decoder.layers.19.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.14.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.weight lr_decay_rate 0.08862938119652507name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.bias lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.decoder.layers.9.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.3.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.16.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.35.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.weight lr_decay_rate 0.3486784401000001_get_param_groups name module.module.decoder.layers.13.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.19.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.weight lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.decoder.layers.19.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.weight key (1.0, 0.05314410000000001, False, False)_get_param_groups name module.module.decoder.layers.14.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.15.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.weight key (0.0, 0.008862938119652507, False, False) _get_param_groups name module.module.decoder.layers.19.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.bias key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.decoder.layers.9.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.4.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.weight lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.weight key (1.0, 0.03486784401000001, False, False) _get_param_groups name module.module.decoder.layers.35.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.19.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.bias lr_decay_rate 0.531441_get_param_groups name module.module.decoder.layers.16.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.14.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.weight key (1.0, 0.05904900000000001, False, False)_get_param_groups name module.module.decoder.layers.13.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.19.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.bias lr_decay_rate 0.08862938119652507_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.weight key (1.0, 0.02058911320946491, False, False)_get_param_groups name module.module.decoder.layers.15.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.9.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.19.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.bias key (0.0, 0.05314410000000001, False, False) _get_param_groups name module.module.decoder.layers.19.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.11.ls1 lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.decoder.layers.4.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.bias lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.pre_mlp_layernorm.bias key (0.0, 0.008862938119652507, False, False)_get_param_groups name module.module.decoder.layers.35.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.16.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.15.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.bias lr_decay_rate 0.20589113209464907_get_param_groups name module.module.decoder.layers.20.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.bias lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.decoder.layers.13.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.19.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.14.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.9.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.bias key (0.0, 0.03486784401000001, False, False) name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.weight lr_decay_rate 0.531441 _get_param_groups name module.module.decoder.layers.20.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.ls1 key (0.0, 0.02541865828329001, False, False)_get_param_groups name module.module.decoder.layers.4.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.weight lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.decoder.layers.15.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.35.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.bias key (0.0, 0.05904900000000001, False, False)_get_param_groups name module.module.decoder.layers.19.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.20.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.16.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.bias key (0.0, 0.02058911320946491, False, False)_get_param_groups name module.module.decoder.layers.9.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.weight lr_decay_rate 0.3486784401000001_get_param_groups name module.module.decoder.layers.13.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.20.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.15.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.11.ls2 lr_decay_rate 0.2541865828329001_get_param_groups name module.module.decoder.layers.4.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.weight key (1.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.weight key (0.0, 0.05314410000000001, False, False)_get_param_groups name module.module.decoder.layers.19.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.15.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.35.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.weight lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.decoder.layers.20.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.weight key (1.0, 0.03486784401000001, False, False) _get_param_groups name module.module.decoder.layers.16.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.ls2 key (0.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.bias lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.decoder.layers.9.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.weight lr_decay_rate 0.20589113209464907_get_param_groups name module.module.decoder.layers.20.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.bias lr_decay_rate 0.531441_get_param_groups name module.module.decoder.layers.14.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.15.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.19.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.15.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.36.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.weight key (1.0, 0.05904900000000001, False, False)_get_param_groups name module.module.decoder.layers.4.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.weight key (1.0, 0.02058911320946491, False, False)_get_param_groups name module.module.decoder.layers.20.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.bias lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.decoder.layers.20.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.weight lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc1.bias key (0.0, 0.008862938119652507, False, False) _get_param_groups name module.module.decoder.layers.16.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.15.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.9.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.bias key (0.0, 0.05314410000000001, False, False) _get_param_groups name module.module.decoder.layers.14.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.15.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.19.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.bias lr_decay_rate 0.5904900000000001_get_param_groups name module.module.decoder.layers.4.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.bias key (0.0, 0.03486784401000001, False, False)_get_param_groups name module.module.decoder.layers.36.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.bias lr_decay_rate 0.20589113209464907_get_param_groups name module.module.decoder.layers.20.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.16.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.16.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.weight key (0.0, 0.02541865828329001, False, False)_get_param_groups name module.module.decoder.layers.10.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.20.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.14.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.15.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.weight lr_decay_rate 0.08862938119652507 _get_param_groups name module.module.decoder.layers.20.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.bias key (0.0, 0.05904900000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.weight lr_decay_rate 0.531441 _get_param_groups name module.module.decoder.layers.4.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.20.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.bias key (0.0, 0.02058911320946491, False, False)_get_param_groups name module.module.decoder.layers.36.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.17.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.16.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.14.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.weight lr_decay_rate 0.3486784401000001name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.bias lr_decay_rate 0.2541865828329001_get_param_groups name module.module.decoder.layers.20.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.10.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.weight key (1.0, 0.008862938119652507, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.weight key (1.0, 0.05314410000000001, False, False) _get_param_groups name module.module.decoder.layers.15.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.36.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.20.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.20.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.5.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.weight lr_decay_rate 0.5904900000000001name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.weight lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.decoder.layers.17.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.weight key (0.0, 0.03486784401000001, False, False)_get_param_groups name module.module.decoder.layers.16.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.bias key (0.0, 0.02541865828329001, False, False)_get_param_groups name module.module.decoder.layers.20.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.20.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.14.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.10.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.bias lr_decay_rate 0.08862938119652507 name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.bias lr_decay_rate 0.531441 _get_param_groups name module.module.decoder.layers.17.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.21.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.15.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.weight key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.weight key (0.0, 0.02058911320946491, False, False)_get_param_groups name module.module.decoder.layers.5.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.21.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.36.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.20.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.16.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.10.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.bias lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.decoder.layers.14.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.1.mlp.linear_fc2.bias key (0.0, 0.008862938119652507, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.bias key (0.0, 0.05314410000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.bias lr_decay_rate 0.5904900000000001_get_param_groups name module.module.decoder.layers.17.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.weight lr_decay_rate 0.2541865828329001_get_param_groups name module.module.decoder.layers.15.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.bias lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.decoder.layers.21.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.10.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.21.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.bias key (0.0, 0.03486784401000001, False, False) _get_param_groups name module.module.decoder.layers.20.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.5.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.36.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.16.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.14.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.bias key (0.0, 0.05904900000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.weight lr_decay_rate 0.531441_get_param_groups name module.module.decoder.layers.16.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.weight key (1.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.2.ls1 lr_decay_rate 0.09847709021836118_get_param_groups name module.module.decoder.layers.21.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.17.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.bias key (0.0, 0.02058911320946491, False, False)_get_param_groups name module.module.decoder.layers.21.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.weight lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.decoder.layers.10.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.15.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.16.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.20.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.5.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.36.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.weight key (1.0, 0.05314410000000001, False, False) _get_param_groups name module.module.decoder.layers.21.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.21.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.bias lr_decay_rate 0.2541865828329001 name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.weight lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.decoder.layers.16.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.17.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.weight key (1.0, 0.03486784401000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.ls1 key (0.0, 0.00984770902183612, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.bias key (0.0, 0.02541865828329001, False, False) _get_param_groups name module.module.decoder.layers.10.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.21.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.16.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.weight lr_decay_rate 0.20589113209464907_get_param_groups name module.module.decoder.layers.15.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.17.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.5.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.20.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.21.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.bias lr_decay_rate 0.531441_get_param_groups name module.module.decoder.layers.16.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.37.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.weight key (1.0, 0.05904900000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.2.ls2 lr_decay_rate 0.09847709021836118name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.weight lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.decoder.layers.11.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.bias lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.decoder.layers.21.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.17.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.16.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.weight key (1.0, 0.02058911320946491, False, False)_get_param_groups name module.module.decoder.layers.15.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.18.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.5.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.21.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.bias key (0.0, 0.05314410000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.bias key (0.0, 0.03486784401000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.ls2 key (0.0, 0.00984770902183612, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.weight key (1.0, 0.02541865828329001, False, False)_get_param_groups name module.module.decoder.layers.21.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.bias lr_decay_rate 0.5904900000000001_get_param_groups name module.module.decoder.layers.37.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.17.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.16.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.11.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.21.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.15.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.bias lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.decoder.layers.5.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.18.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.21.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.weight lr_decay_rate 0.3486784401000001name module.module.external_feature_model.vit.decoder.layers.19.ls1 lr_decay_rate 0.5904900000000001 name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.bias lr_decay_rate 0.2541865828329001_get_param_groups name module.module.decoder.layers.17.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.21.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.bias key (0.0, 0.05904900000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.weight lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.decoder.layers.37.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.6.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.bias key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.decoder.layers.18.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.15.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.16.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.11.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.17.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.21.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.22.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.weight key (1.0, 0.03486784401000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.ls1 key (0.0, 0.05904900000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.bias key (0.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.weight key (0.0, 0.00984770902183612, False, False) _get_param_groups name module.module.decoder.layers.22.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.weight lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.decoder.layers.18.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.6.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.16.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.21.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.weight lr_decay_rate 0.20589113209464907_get_param_groups name module.module.decoder.layers.15.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.11.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.17.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.22.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.22.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.bias lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.19.ls2 lr_decay_rate 0.5904900000000001 name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.bias lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.weight key (1.0, 0.05904900000000001, False, False)_get_param_groups name module.module.decoder.layers.37.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.weight lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.weight key (1.0, 0.02058911320946491, False, False) _get_param_groups name module.module.decoder.layers.17.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.6.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.17.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.11.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.18.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.15.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.22.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.21.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.bias key (0.0, 0.03486784401000001, False, False) _get_param_groups name module.module.decoder.layers.22.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.ls2 key (0.0, 0.05904900000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.input_layernorm.bias key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.bias lr_decay_rate 0.5904900000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.weight key (0.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.bias lr_decay_rate 0.20589113209464907_get_param_groups name module.module.decoder.layers.37.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.17.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.21.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.17.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.22.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.16.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.6.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.11.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.bias key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.decoder.layers.18.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.22.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.15.ls1 lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.decoder.layers.37.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.weight lr_decay_rate 0.5904900000000001name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.bias lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.bias key (0.0, 0.02058911320946491, False, False) name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.weight lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.decoder.layers.21.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.18.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.18.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.17.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.22.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.16.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.11.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.6.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.weight key (0.0, 0.05904900000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.ls1 key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.decoder.layers.22.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.20.ls1 lr_decay_rate 0.6561_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.bias key (0.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.10.ls1 lr_decay_rate 0.2287679245496101_get_param_groups name module.module.decoder.layers.22.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.38.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.weight key (1.0, 0.00984770902183612, False, False) _get_param_groups name module.module.decoder.layers.22.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.18.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.6.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.17.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.19.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.bias lr_decay_rate 0.5904900000000001_get_param_groups name module.module.decoder.layers.12.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.16.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.ls1 key (0.0, 0.06561, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.ls1 key (0.0, 0.02287679245496101, False, False) name module.module.external_feature_model.vit.decoder.layers.15.ls2 lr_decay_rate 0.3874204890000001name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.bias lr_decay_rate 0.09847709021836118 name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.weight lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.decoder.layers.22.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.22.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.22.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.38.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.ls2 key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.decoder.layers.18.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.6.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.bias key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.decoder.layers.17.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_proj.bias key (0.0, 0.00984770902183612, False, False) name module.module.external_feature_model.vit.decoder.layers.20.ls2 lr_decay_rate 0.6561_get_param_groups name module.module.decoder.layers.16.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.19.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.12.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.weight key (1.0, 0.02541865828329001, False, False)_get_param_groups name module.module.decoder.layers.23.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.10.ls2 lr_decay_rate 0.2287679245496101 name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.weight lr_decay_rate 0.3874204890000001_get_param_groups name module.module.decoder.layers.22.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.17.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.22.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.38.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.18.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.7.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.weight lr_decay_rate 0.5904900000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.ls2 key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.ls2 key (0.0, 0.06561, False, False)name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.weight lr_decay_rate 0.09847709021836118 _get_param_groups name module.module.decoder.layers.23.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.19.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.12.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.bias lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.decoder.layers.16.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.weight key (0.0, 0.03874204890000001, False, False)_get_param_groups name module.module.decoder.layers.17.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.22.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.23.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.38.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.weight lr_decay_rate 0.2287679245496101_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.weight key (1.0, 0.05904900000000001, False, False)_get_param_groups name module.module.decoder.layers.18.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.7.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.weight key (1.0, 0.00984770902183612, False, False)name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.weight lr_decay_rate 0.6561 _get_param_groups name module.module.decoder.layers.23.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.19.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.12.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.bias key (0.0, 0.02541865828329001, False, False)_get_param_groups name module.module.decoder.layers.16.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.bias lr_decay_rate 0.3874204890000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.weight key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.decoder.layers.18.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.weight key (0.0, 0.06561, False, False)_get_param_groups name module.module.decoder.layers.38.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.bias lr_decay_rate 0.5904900000000001_get_param_groups name module.module.decoder.layers.22.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.23.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.18.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.16.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.bias lr_decay_rate 0.09847709021836118name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.weight lr_decay_rate 0.2541865828329001 name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.bias lr_decay_rate 0.2287679245496101_get_param_groups name module.module.decoder.layers.23.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.7.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.bias key (0.0, 0.03874204890000001, False, False)name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.bias lr_decay_rate 0.6561 _get_param_groups name module.module.decoder.layers.19.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.12.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.23.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.weight key (1.0, 0.02541865828329001, False, False)_get_param_groups name module.module.decoder.layers.18.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.bias key (0.0, 0.02287679245496101, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.bias key (0.0, 0.05904900000000001, False, False)_get_param_groups name module.module.decoder.layers.38.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.19.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.7.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.22.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.18.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.self_attention.linear_qkv.bias key (0.0, 0.00984770902183612, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.bias key (0.0, 0.06561, False, False) _get_param_groups name module.module.decoder.layers.12.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.23.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.17.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.weight lr_decay_rate 0.3874204890000001_get_param_groups name module.module.decoder.layers.38.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.18.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.bias lr_decay_rate 0.2541865828329001_get_param_groups name module.module.decoder.layers.23.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.12.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.weight lr_decay_rate 0.5904900000000001 name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.weight lr_decay_rate 0.2287679245496101_get_param_groups name module.module.decoder.layers.19.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.22.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.weight lr_decay_rate 0.09847709021836118_get_param_groups name module.module.decoder.layers.23.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.19.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.7.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.weight key (1.0, 0.03874204890000001, False, False)_get_param_groups name module.module.decoder.layers.39.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.weight lr_decay_rate 0.6561_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.bias key (0.0, 0.02541865828329001, False, False) _get_param_groups name module.module.decoder.layers.18.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.weight key (1.0, 0.05904900000000001, False, False) _get_param_groups name module.module.decoder.layers.23.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.23.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.weight key (1.0, 0.02287679245496101, False, False)_get_param_groups name module.module.decoder.layers.20.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.13.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.17.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.weight key (0.0, 0.00984770902183612, False, False) _get_param_groups name module.module.decoder.layers.23.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.7.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.weight key (1.0, 0.06561, False, False)_get_param_groups name module.module.decoder.layers.39.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.19.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.12.ls1 lr_decay_rate 0.2824295364810001 name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.bias lr_decay_rate 0.3874204890000001 name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.bias lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.decoder.layers.18.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.24.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.bias lr_decay_rate 0.09847709021836118_get_param_groups name module.module.decoder.layers.23.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.bias lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.decoder.layers.23.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.20.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.17.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.ls1 key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.decoder.layers.13.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.19.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.bias key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.decoder.layers.7.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.bias key (0.0, 0.05904900000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.bias lr_decay_rate 0.6561_get_param_groups name module.module.decoder.layers.39.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.pre_mlp_layernorm.bias key (0.0, 0.00984770902183612, False, False)_get_param_groups name module.module.decoder.layers.17.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.18.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.23.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.bias key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.decoder.layers.24.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.23.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.20.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.19.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.12.ls2 lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.decoder.layers.13.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.weight lr_decay_rate 0.3874204890000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.bias key (0.0, 0.06561, False, False) _get_param_groups name module.module.decoder.layers.8.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.23.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.weight lr_decay_rate 0.09847709021836118_get_param_groups name module.module.decoder.layers.39.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.weight lr_decay_rate 0.5904900000000001_get_param_groups name module.module.decoder.layers.17.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.weight lr_decay_rate 0.2287679245496101_get_param_groups name module.module.decoder.layers.24.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.18.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.weight key (1.0, 0.03874204890000001, False, False)_get_param_groups name module.module.decoder.layers.24.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.20.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.19.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.ls2 key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.decoder.layers.13.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.weight lr_decay_rate 0.6561_get_param_groups name module.module.decoder.layers.23.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.weight key (1.0, 0.02287679245496101, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.weight key (1.0, 0.00984770902183612, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.weight key (0.0, 0.05904900000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.bias lr_decay_rate 0.3874204890000001_get_param_groups name module.module.decoder.layers.8.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.19.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.weight lr_decay_rate 0.2824295364810001_get_param_groups name module.module.decoder.layers.17.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.24.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.20.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.39.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.24.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.23.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.19.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.13.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.bias lr_decay_rate 0.5904900000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.weight key (1.0, 0.06561, False, False) name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.bias lr_decay_rate 0.09847709021836118_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.bias key (0.0, 0.03874204890000001, False, False)name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.bias lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.decoder.layers.20.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.8.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.19.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.bias key (0.0, 0.05904900000000001, False, False)_get_param_groups name module.module.decoder.layers.24.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.weight key (0.0, 0.028242953648100012, False, False)_get_param_groups name module.module.decoder.layers.24.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.23.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.bias lr_decay_rate 0.6561 _get_param_groups name module.module.decoder.layers.13.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.17.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.39.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.bias key (0.0, 0.02287679245496101, False, False)_get_param_groups name module.module.decoder.layers.19.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc1.bias key (0.0, 0.00984770902183612, False, False)_get_param_groups name module.module.decoder.layers.19.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.weight lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.decoder.layers.24.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.20.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.8.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.bias lr_decay_rate 0.2824295364810001_get_param_groups name module.module.decoder.layers.24.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.24.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.weight lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.bias key (0.0, 0.06561, False, False) _get_param_groups name module.module.decoder.layers.13.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.weight key (0.0, 0.03874204890000001, False, False)_get_param_groups name module.module.decoder.layers.18.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.20.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.19.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.weight lr_decay_rate 0.09847709021836118_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.bias key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.decoder.layers.21.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.weight lr_decay_rate 0.2287679245496101_get_param_groups name module.module.decoder.layers.39.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.24.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.24.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.weight key (1.0, 0.05904900000000001, False, False)_get_param_groups name module.module.decoder.layers.8.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.bias lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.decoder.layers.14.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.24.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.18.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.20.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.weight lr_decay_rate 0.6561 _get_param_groups name module.module.decoder.layers.19.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.weight key (0.0, 0.02287679245496101, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.weight key (1.0, 0.00984770902183612, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.bias key (0.0, 0.03874204890000001, False, False)name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.bias lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.decoder.layers.21.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.24.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.25.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.weight lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.decoder.layers.40.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.24.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.8.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.18.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.14.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.20.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.weight key (0.0, 0.06561, False, False) name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.bias lr_decay_rate 0.2287679245496101_get_param_groups name module.module.decoder.layers.19.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.bias lr_decay_rate 0.09847709021836118name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.weight lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.bias key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.decoder.layers.24.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.21.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.weight key (1.0, 0.028242953648100012, False, False) _get_param_groups name module.module.decoder.layers.20.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.8.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.25.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.18.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.14.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.24.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.weight key (1.0, 0.03874204890000001, False, False) name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.bias lr_decay_rate 0.6561_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.bias key (0.0, 0.02287679245496101, False, False) name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.bias lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.decoder.layers.40.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.2.mlp.linear_fc2.bias key (0.0, 0.00984770902183612, False, False)_get_param_groups name module.module.decoder.layers.19.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.21.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.24.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.weight lr_decay_rate 0.5904900000000001_get_param_groups name module.module.decoder.layers.25.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.9.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.14.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.20.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.18.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.bias key (0.0, 0.028242953648100012, False, False)_get_param_groups name module.module.decoder.layers.25.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.bias lr_decay_rate 0.3874204890000001name module.module.external_feature_model.vit.decoder.layers.3.ls1 lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.decoder.layers.20.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.bias key (0.0, 0.06561, False, False) name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.weight lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.decoder.layers.24.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.40.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.weight key (1.0, 0.05904900000000001, False, False)_get_param_groups name module.module.decoder.layers.25.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.18.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.21.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.20.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.9.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.bias key (0.0, 0.03874204890000001, False, False) name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.weight lr_decay_rate 0.2824295364810001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.ls1 key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.weight lr_decay_rate 0.6561_get_param_groups name module.module.decoder.layers.14.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.24.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.bias lr_decay_rate 0.5904900000000001_get_param_groups name module.module.decoder.layers.40.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.25.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.25.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.weight key (1.0, 0.02287679245496101, False, False) _get_param_groups name module.module.decoder.layers.20.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.18.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.21.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.3.ls2 lr_decay_rate 0.10941898913151242_get_param_groups name module.module.decoder.layers.20.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.14.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.weight key (1.0, 0.028242953648100012, False, False)_get_param_groups name module.module.decoder.layers.25.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.25.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.9.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.weight lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.decoder.layers.25.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.weight key (1.0, 0.06561, False, False)name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.bias lr_decay_rate 0.2287679245496101_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.bias key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.decoder.layers.20.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.21.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.21.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.19.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.ls2 key (0.0, 0.010941898913151242, False, False) _get_param_groups name module.module.decoder.layers.9.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.25.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.25.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.14.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.bias lr_decay_rate 0.2824295364810001 name module.module.external_feature_model.vit.decoder.layers.20.ls1 lr_decay_rate 0.6561_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.weight key (1.0, 0.03874204890000001, False, False) _get_param_groups name module.module.decoder.layers.25.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.bias key (0.0, 0.02287679245496101, False, False)name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.bias lr_decay_rate 0.6561 _get_param_groups name module.module.decoder.layers.20.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.19.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.25.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.22.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.9.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.21.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.40.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.bias key (0.0, 0.028242953648100012, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.bias key (0.0, 0.06561, False, False)name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.weight lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.decoder.layers.25.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.15.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.ls1 key (0.0, 0.06561, False, False)name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.weight lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.decoder.layers.26.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.bias lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.decoder.layers.21.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.20.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.22.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.19.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.25.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.15.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.25.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.weight lr_decay_rate 0.6561_get_param_groups name module.module.decoder.layers.9.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.20.ls2 lr_decay_rate 0.6561_get_param_groups name module.module.decoder.layers.40.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.weight key (0.0, 0.010941898913151242, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.weight key (1.0, 0.02287679245496101, False, False) _get_param_groups name module.module.decoder.layers.26.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.weight lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.bias key (0.0, 0.03874204890000001, False, False)_get_param_groups name module.module.decoder.layers.21.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.22.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.20.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.25.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.19.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.25.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.9.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.15.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.weight key (1.0, 0.06561, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.ls2 key (0.0, 0.06561, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.weight key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.decoder.layers.20.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.41.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.bias lr_decay_rate 0.10941898913151242 name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.bias lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.decoder.layers.26.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.25.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.10.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.22.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.16.ls1 lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.decoder.layers.21.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.19.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.15.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.bias lr_decay_rate 0.2824295364810001name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.bias lr_decay_rate 0.6561 name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.weight lr_decay_rate 0.6561 _get_param_groups name module.module.decoder.layers.26.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.26.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.21.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.input_layernorm.bias key (0.0, 0.010941898913151242, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.bias key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.decoder.layers.41.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.25.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.ls1 key (0.0, 0.04304672100000001, False, False) _get_param_groups name module.module.decoder.layers.10.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.21.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.22.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.bias key (0.0, 0.028242953648100012, False, False)_get_param_groups name module.module.decoder.layers.19.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.bias key (0.0, 0.06561, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.weight key (0.0, 0.06561, False, False)_get_param_groups name module.module.decoder.layers.26.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.41.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.15.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.11.ls1 lr_decay_rate 0.2541865828329001_get_param_groups name module.module.decoder.layers.26.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.21.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.26.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.16.ls2 lr_decay_rate 0.4304672100000001name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.weight lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.decoder.layers.21.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.26.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.10.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.19.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.41.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.bias lr_decay_rate 0.6561 name module.module.external_feature_model.vit.decoder.layers.21.ls1 lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.decoder.layers.22.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.weight lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.ls2 key (0.0, 0.04304672100000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.ls1 key (0.0, 0.02541865828329001, False, False)_get_param_groups name module.module.decoder.layers.15.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.21.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.26.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.bias key (0.0, 0.06561, False, False) _get_param_groups name module.module.decoder.layers.22.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.10.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.20.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.26.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.weight key (1.0, 0.010941898913151242, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.ls1 key (0.0, 0.0729, False, False)_get_param_groups name module.module.decoder.layers.26.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.weight key (1.0, 0.028242953648100012, False, False) name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.weight lr_decay_rate 0.4304672100000001name module.module.external_feature_model.vit.decoder.layers.11.ls2 lr_decay_rate 0.2541865828329001_get_param_groups name module.module.decoder.layers.41.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.22.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.22.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.15.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.26.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.21.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.20.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.21.ls2 lr_decay_rate 0.7290000000000001 name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.weight lr_decay_rate 0.6561 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.ls2 key (0.0, 0.02541865828329001, False, False)_get_param_groups name module.module.decoder.layers.26.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.10.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.bias lr_decay_rate 0.10941898913151242 name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.bias lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.decoder.layers.41.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.weight key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.decoder.layers.26.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.22.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.16.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.23.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.ls2 key (0.0, 0.0729, False, False) _get_param_groups name module.module.decoder.layers.27.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.weight key (1.0, 0.06561, False, False)_get_param_groups name module.module.decoder.layers.20.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.21.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.26.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_proj.bias key (0.0, 0.010941898913151242, False, False)name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.weight lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.bias key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.decoder.layers.26.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.10.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.bias lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.decoder.layers.22.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.41.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.27.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.20.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.16.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.weight lr_decay_rate 0.7290000000000001 name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.bias lr_decay_rate 0.6561 _get_param_groups name module.module.decoder.layers.23.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.26.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.21.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.weight lr_decay_rate 0.10941898913151242_get_param_groups name module.module.decoder.layers.42.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.weight key (0.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.weight lr_decay_rate 0.2824295364810001_get_param_groups name module.module.decoder.layers.10.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.bias key (0.0, 0.04304672100000001, False, False) _get_param_groups name module.module.decoder.layers.26.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.22.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.27.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.16.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.20.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.27.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.bias key (0.0, 0.06561, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.weight key (0.0, 0.0729, False, False)_get_param_groups name module.module.decoder.layers.23.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.21.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.weight key (1.0, 0.028242953648100012, False, False)_get_param_groups name module.module.decoder.layers.11.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.bias lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.weight key (1.0, 0.010941898913151242, False, False) _get_param_groups name module.module.decoder.layers.22.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.23.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.42.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.26.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.27.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.weight lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.decoder.layers.16.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.20.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.27.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.22.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.weight lr_decay_rate 0.6561 name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.bias lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.bias key (0.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.bias lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.decoder.layers.22.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.23.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.bias lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.decoder.layers.42.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.11.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.weight key (1.0, 0.06561, False, False) _get_param_groups name module.module.decoder.layers.26.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.27.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.20.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.weight key (1.0, 0.04304672100000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.bias key (0.0, 0.0729, False, False) _get_param_groups name module.module.decoder.layers.22.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.27.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.16.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.bias key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.decoder.layers.23.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.23.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.self_attention.linear_qkv.bias key (0.0, 0.010941898913151242, False, False) name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.weight lr_decay_rate 0.2541865828329001name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.bias lr_decay_rate 0.6561_get_param_groups name module.module.decoder.layers.16.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.42.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.27.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.27.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.11.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.27.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.21.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.bias lr_decay_rate 0.4304672100000001name module.module.external_feature_model.vit.decoder.layers.13.ls1 lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.decoder.layers.22.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.weight lr_decay_rate 0.7290000000000001_get_param_groups name module.module.decoder.layers.23.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.23.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.bias key (0.0, 0.06561, False, False) _get_param_groups name module.module.decoder.layers.16.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.weight key (1.0, 0.02541865828329001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.bias key (0.0, 0.04304672100000001, False, False) _get_param_groups name module.module.decoder.layers.11.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.weight lr_decay_rate 0.10941898913151242_get_param_groups name module.module.decoder.layers.27.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.42.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.ls1 key (0.0, 0.031381059609000006, False, False)_get_param_groups name module.module.decoder.layers.23.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.27.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.24.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.22.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.27.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.bias lr_decay_rate 0.2541865828329001 name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.weight lr_decay_rate 0.4304672100000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.weight key (0.0, 0.010941898913151242, False, False)_get_param_groups name module.module.decoder.layers.21.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.weight key (1.0, 0.0729, False, False) _get_param_groups name module.module.decoder.layers.17.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.weight lr_decay_rate 0.6561 _get_param_groups name module.module.decoder.layers.28.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.27.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.11.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.24.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.22.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.42.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.bias key (0.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.weight key (1.0, 0.04304672100000001, False, False) _get_param_groups name module.module.decoder.layers.23.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.27.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.13.ls2 lr_decay_rate 0.31381059609000006_get_param_groups name module.module.decoder.layers.27.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.21.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.bias lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.weight key (0.0, 0.06561, False, False) name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.bias lr_decay_rate 0.7290000000000001_get_param_groups name module.module.decoder.layers.11.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.17.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.28.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.24.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.ls2 key (0.0, 0.031381059609000006, False, False)_get_param_groups name module.module.decoder.layers.22.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.27.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.weight lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.pre_mlp_layernorm.bias key (0.0, 0.010941898913151242, False, False) _get_param_groups name module.module.decoder.layers.27.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.21.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.23.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.bias lr_decay_rate 0.4304672100000001_get_param_groups name module.module.decoder.layers.11.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.28.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.bias key (0.0, 0.0729, False, False) name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.bias lr_decay_rate 0.6561 _get_param_groups name module.module.decoder.layers.24.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.17.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.weight lr_decay_rate 0.31381059609000006_get_param_groups name module.module.decoder.layers.22.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.28.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.weight key (1.0, 0.02541865828329001, False, False) _get_param_groups name module.module.decoder.layers.27.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.21.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.bias key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.bias key (0.0, 0.06561, False, False) _get_param_groups name module.module.decoder.layers.23.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.weight lr_decay_rate 0.10941898913151242 name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.weight lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.decoder.layers.28.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.17.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.12.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.24.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.weight key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.decoder.layers.43.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.23.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.bias lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.decoder.layers.28.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.27.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.21.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.weight key (1.0, 0.0729, False, False) name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.weight lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.decoder.layers.23.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.weight lr_decay_rate 0.6561 _get_param_groups name module.module.decoder.layers.28.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.24.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.bias lr_decay_rate 0.31381059609000006_get_param_groups name module.module.decoder.layers.17.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.12.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.bias key (0.0, 0.02541865828329001, False, False)_get_param_groups name module.module.decoder.layers.43.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.weight key (1.0, 0.010941898913151242, False, False) _get_param_groups name module.module.decoder.layers.28.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.23.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.weight key (1.0, 0.06561, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.weight key (0.0, 0.04304672100000001, False, False)name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.bias lr_decay_rate 0.7290000000000001_get_param_groups name module.module.decoder.layers.28.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.28.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.21.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.bias key (0.0, 0.031381059609000006, False, False)_get_param_groups name module.module.decoder.layers.24.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.24.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.17.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.12.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.bias lr_decay_rate 0.10941898913151242 name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.weight lr_decay_rate 0.2541865828329001_get_param_groups name module.module.decoder.layers.28.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.23.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.bias key (0.0, 0.0729, False, False)name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.bias lr_decay_rate 0.6561_get_param_groups name module.module.decoder.layers.28.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.bias lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.decoder.layers.22.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.28.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc1.bias key (0.0, 0.010941898913151242, False, False)_get_param_groups name module.module.decoder.layers.12.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.weight key (0.0, 0.02541865828329001, False, False)_get_param_groups name module.module.decoder.layers.25.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.24.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.17.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.28.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.weight lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.decoder.layers.29.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.bias key (0.0, 0.06561, False, False)_get_param_groups name module.module.decoder.layers.23.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.bias key (0.0, 0.04304672100000001, False, False) _get_param_groups name module.module.decoder.layers.28.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.weight lr_decay_rate 0.7290000000000001name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.weight lr_decay_rate 0.10941898913151242 _get_param_groups name module.module.decoder.layers.22.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.bias lr_decay_rate 0.2541865828329001_get_param_groups name module.module.decoder.layers.24.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.18.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.12.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.25.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.weight key (1.0, 0.031381059609000006, False, False) _get_param_groups name module.module.decoder.layers.43.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.29.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.28.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.weight key (1.0, 0.010941898913151242, False, False)name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.weight lr_decay_rate 0.6561 name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.weight lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.decoder.layers.28.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.weight key (0.0, 0.0729, False, False) _get_param_groups name module.module.decoder.layers.23.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.22.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.bias key (0.0, 0.02541865828329001, False, False) _get_param_groups name module.module.decoder.layers.24.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.18.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.25.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.12.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.weight key (1.0, 0.06561, False, False) name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.bias lr_decay_rate 0.31381059609000006_get_param_groups name module.module.decoder.layers.29.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.28.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.bias lr_decay_rate 0.10941898913151242_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.weight key (1.0, 0.04304672100000001, False, False)_get_param_groups name module.module.decoder.layers.23.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.28.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.weight lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.decoder.layers.22.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.25.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.bias lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.decoder.layers.18.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.24.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.12.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.bias key (0.0, 0.031381059609000006, False, False)name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.bias lr_decay_rate 0.6561 _get_param_groups name module.module.decoder.layers.23.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.bias key (0.0, 0.0729, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.3.mlp.linear_fc2.bias key (0.0, 0.010941898913151242, False, False) _get_param_groups name module.module.decoder.layers.44.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.bias lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.decoder.layers.28.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.weight key (1.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.bias key (0.0, 0.06561, False, False) _get_param_groups name module.module.decoder.layers.18.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.24.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.25.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.13.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.24.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.weight lr_decay_rate 0.7290000000000001 name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.weight lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.decoder.layers.22.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.bias key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.decoder.layers.24.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.44.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.28.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.weight key (1.0, 0.0729, False, False) name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.bias lr_decay_rate 0.2541865828329001 name module.module.external_feature_model.vit.decoder.layers.4.ls1 lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.decoder.layers.18.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.21.ls1 lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.decoder.layers.25.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.weight key (1.0, 0.031381059609000006, False, False) _get_param_groups name module.module.decoder.layers.24.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.22.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.29.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.13.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.29.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.25.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.weight lr_decay_rate 0.4304672100000001_get_param_groups name module.module.decoder.layers.44.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.bias lr_decay_rate 0.7290000000000001_get_param_groups name module.module.decoder.layers.24.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.bias key (0.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.ls1 key (0.0, 0.0729, False, False)_get_param_groups name module.module.decoder.layers.25.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.ls1 key (0.0, 0.012157665459056936, False, False)_get_param_groups name module.module.decoder.layers.18.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.29.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.bias lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.decoder.layers.13.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.22.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.weight key (1.0, 0.04304672100000001, False, False)_get_param_groups name module.module.decoder.layers.44.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.29.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.bias key (0.0, 0.0729, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.bias key (0.0, 0.031381059609000006, False, False)_get_param_groups name module.module.decoder.layers.29.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.25.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.24.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.21.ls2 lr_decay_rate 0.7290000000000001_get_param_groups name module.module.decoder.layers.26.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.4.ls2 lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.weight lr_decay_rate 0.2541865828329001_get_param_groups name module.module.decoder.layers.30.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.18.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.13.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.bias lr_decay_rate 0.4304672100000001_get_param_groups name module.module.decoder.layers.23.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.25.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.29.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.weight lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.ls2 key (0.0, 0.012157665459056936, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.ls2 key (0.0, 0.0729, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.weight key (1.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.weight lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.decoder.layers.24.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.26.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.19.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.bias key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.decoder.layers.44.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.30.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.25.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.weight key (1.0, 0.0729, False, False)_get_param_groups name module.module.decoder.layers.13.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.weight key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.decoder.layers.23.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.weight lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.weight lr_decay_rate 0.7290000000000001 name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.bias lr_decay_rate 0.2541865828329001_get_param_groups name module.module.decoder.layers.24.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.19.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.26.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.bias lr_decay_rate 0.31381059609000006_get_param_groups name module.module.decoder.layers.44.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.30.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.bias lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.decoder.layers.25.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.29.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.13.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.17.ls1 lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.bias key (0.0, 0.02541865828329001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.weight key (0.0, 0.012157665459056936, False, False)_get_param_groups name module.module.decoder.layers.24.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.bias key (0.0, 0.031381059609000006, False, False)_get_param_groups name module.module.decoder.layers.26.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.bias key (0.0, 0.0729, False, False) _get_param_groups name module.module.decoder.layers.23.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.weight key (0.0, 0.0729, False, False) _get_param_groups name module.module.decoder.layers.30.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.19.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.30.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.45.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.25.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.13.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.ls1 key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.decoder.layers.25.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.bias lr_decay_rate 0.12157665459056935_get_param_groups name module.module.decoder.layers.23.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.26.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.22.ls1 lr_decay_rate 0.81name module.module.external_feature_model.vit.decoder.layers.12.ls1 lr_decay_rate 0.2824295364810001 name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.weight lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.decoder.layers.19.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.bias lr_decay_rate 0.7290000000000001 name module.module.external_feature_model.vit.decoder.layers.17.ls2 lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.decoder.layers.25.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.29.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.30.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.45.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.30.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.14.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.input_layernorm.bias key (0.0, 0.012157665459056936, False, False)_get_param_groups name module.module.decoder.layers.25.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.ls1 key (0.0, 0.028242953648100012, False, False)_get_param_groups name module.module.decoder.layers.19.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.26.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.ls1 key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.weight key (1.0, 0.031381059609000006, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.bias key (0.0, 0.0729, False, False)_get_param_groups name module.module.decoder.layers.23.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.30.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.ls2 key (0.0, 0.04782969000000001, False, False)_get_param_groups name module.module.decoder.layers.30.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.26.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.45.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.30.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.14.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.26.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.12.ls2 lr_decay_rate 0.2824295364810001_get_param_groups name module.module.decoder.layers.19.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.ls2 lr_decay_rate 0.81 _get_param_groups name module.module.decoder.layers.25.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.weight lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.bias lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.decoder.layers.30.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.30.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.23.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.30.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.weight lr_decay_rate 0.4782969000000001name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.weight lr_decay_rate 0.7290000000000001_get_param_groups name module.module.decoder.layers.45.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.26.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.ls2 key (0.0, 0.028242953648100012, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.ls2 key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.30.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.14.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.25.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.27.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.weight key (1.0, 0.012157665459056936, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.bias key (0.0, 0.031381059609000006, False, False)_get_param_groups name module.module.decoder.layers.19.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.23.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.weight key (1.0, 0.0729, False, False)_get_param_groups name module.module.decoder.layers.31.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.45.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.weight key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.decoder.layers.30.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.26.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.bias lr_decay_rate 0.12157665459056935_get_param_groups name module.module.decoder.layers.30.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.weight lr_decay_rate 0.2824295364810001_get_param_groups name module.module.decoder.layers.25.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.14.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.27.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.weight lr_decay_rate 0.81name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.weight lr_decay_rate 0.31381059609000006name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.bias lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.decoder.layers.20.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.26.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.24.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.45.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.31.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.bias lr_decay_rate 0.4782969000000001_get_param_groups name module.module.decoder.layers.30.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.weight key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_proj.bias key (0.0, 0.012157665459056936, False, False) _get_param_groups name module.module.decoder.layers.27.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.25.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.weight key (0.0, 0.08100000000000002, False, False)_get_param_groups name module.module.decoder.layers.30.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.weight key (1.0, 0.031381059609000006, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.bias key (0.0, 0.0729, False, False) _get_param_groups name module.module.decoder.layers.14.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.45.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.bias key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.decoder.layers.26.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.24.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.27.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.30.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.20.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.25.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.31.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.bias lr_decay_rate 0.2824295364810001 name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.bias lr_decay_rate 0.31381059609000006 name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.weight lr_decay_rate 0.12157665459056935name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.bias lr_decay_rate 0.81_get_param_groups name module.module.decoder.layers.30.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.weight lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.decoder.layers.20.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.weight lr_decay_rate 0.4782969000000001_get_param_groups name module.module.decoder.layers.27.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.14.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.bias key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.decoder.layers.46.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.weight key (1.0, 0.0729, False, False)_get_param_groups name module.module.decoder.layers.26.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.24.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.31.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.31.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.26.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.30.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.bias key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.weight key (1.0, 0.012157665459056936, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.bias key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.24.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.26.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.20.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.weight key (1.0, 0.04782969000000001, False, False) _get_param_groups name module.module.decoder.layers.27.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.bias lr_decay_rate 0.7290000000000001 name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.weight lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.decoder.layers.14.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.26.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.31.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.46.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.31.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.31.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.27.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.bias lr_decay_rate 0.12157665459056935 name module.module.external_feature_model.vit.decoder.layers.14.ls1 lr_decay_rate 0.3486784401000001_get_param_groups name module.module.decoder.layers.27.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.bias key (0.0, 0.0729, False, False) name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.bias lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.decoder.layers.24.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.weight lr_decay_rate 0.81_get_param_groups name module.module.decoder.layers.20.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.weight key (1.0, 0.028242953648100012, False, False) _get_param_groups name module.module.decoder.layers.15.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.26.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.31.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.28.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.46.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.self_attention.linear_qkv.bias key (0.0, 0.012157665459056936, False, False) _get_param_groups name module.module.decoder.layers.31.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.bias key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.decoder.layers.31.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.ls1 key (0.0, 0.03486784401000001, False, False)_get_param_groups name module.module.decoder.layers.27.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.20.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.weight key (1.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.24.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.weight lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.decoder.layers.31.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.26.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.bias lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.decoder.layers.46.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.15.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.31.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.weight lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.decoder.layers.31.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.27.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.28.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.weight lr_decay_rate 0.12157665459056935_get_param_groups name module.module.decoder.layers.20.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.bias key (0.0, 0.028242953648100012, False, False) name module.module.external_feature_model.vit.decoder.layers.14.ls2 lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.bias lr_decay_rate 0.81 _get_param_groups name module.module.decoder.layers.24.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.weight key (0.0, 0.0729, False, False) _get_param_groups name module.module.decoder.layers.31.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.46.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.weight key (1.0, 0.04782969000000001, False, False) _get_param_groups name module.module.decoder.layers.32.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.26.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.ls2 key (0.0, 0.03486784401000001, False, False)_get_param_groups name module.module.decoder.layers.15.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.weight key (0.0, 0.012157665459056936, False, False)name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.weight lr_decay_rate 0.2824295364810001_get_param_groups name module.module.decoder.layers.27.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.21.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.bias key (0.0, 0.08100000000000002, False, False)_get_param_groups name module.module.decoder.layers.28.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.31.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.25.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.bias lr_decay_rate 0.7290000000000001 name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.bias lr_decay_rate 0.4782969000000001_get_param_groups name module.module.decoder.layers.46.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.31.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.32.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.26.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.weight key (1.0, 0.028242953648100012, False, False) _get_param_groups name module.module.decoder.layers.15.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.weight lr_decay_rate 0.3486784401000001_get_param_groups name module.module.decoder.layers.31.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.bias lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.decoder.layers.28.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.21.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.27.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.26.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.weight lr_decay_rate 0.81_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.bias key (0.0, 0.0729, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.bias key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.decoder.layers.46.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.25.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.pre_mlp_layernorm.bias key (0.0, 0.012157665459056936, False, False)_get_param_groups name module.module.decoder.layers.31.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.32.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.weight key (0.0, 0.03486784401000001, False, False) name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.bias lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.decoder.layers.27.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.31.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.15.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.weight key (1.0, 0.08100000000000002, False, False)_get_param_groups name module.module.decoder.layers.21.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.weight lr_decay_rate 0.7290000000000001_get_param_groups name module.module.decoder.layers.28.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.25.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.31.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.32.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.27.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.bias lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.bias key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.decoder.layers.27.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.weight lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.decoder.layers.47.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.weight lr_decay_rate 0.12157665459056935_get_param_groups name module.module.decoder.layers.32.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.weight key (1.0, 0.0729, False, False)name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.bias lr_decay_rate 0.81 _get_param_groups name module.module.decoder.layers.15.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.21.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.32.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.25.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.28.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.bias key (0.0, 0.03486784401000001, False, False)_get_param_groups name module.module.decoder.layers.32.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.bias key (0.0, 0.08100000000000002, False, False) name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.bias lr_decay_rate 0.7290000000000001_get_param_groups name module.module.decoder.layers.28.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.weight key (1.0, 0.012157665459056936, False, False)_get_param_groups name module.module.decoder.layers.27.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.weight lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.weight key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.decoder.layers.47.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.32.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.15.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.21.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.32.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.25.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.28.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.bias lr_decay_rate 0.12157665459056935_get_param_groups name module.module.decoder.layers.27.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.32.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.weight lr_decay_rate 0.3486784401000001name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.weight lr_decay_rate 0.81 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.bias key (0.0, 0.0729, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.weight key (0.0, 0.028242953648100012, False, False)_get_param_groups name module.module.decoder.layers.28.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.bias lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc1.bias key (0.0, 0.012157665459056936, False, False)_get_param_groups name module.module.decoder.layers.47.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.32.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.16.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.32.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.27.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.21.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.25.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.weight key (1.0, 0.03486784401000001, False, False) _get_param_groups name module.module.decoder.layers.29.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.28.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.bias lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.weight key (0.0, 0.08100000000000002, False, False)_get_param_groups name module.module.decoder.layers.32.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.weight lr_decay_rate 0.7290000000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.bias key (0.0, 0.04782969000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.weight lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.decoder.layers.32.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.32.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.21.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.16.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.bias lr_decay_rate 0.3486784401000001_get_param_groups name module.module.decoder.layers.29.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.25.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.bias key (0.0, 0.028242953648100012, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.weight key (1.0, 0.0729, False, False)_get_param_groups name module.module.decoder.layers.28.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.27.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.weight lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.decoder.layers.33.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.bias lr_decay_rate 0.81 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.weight key (1.0, 0.012157665459056936, False, False) _get_param_groups name module.module.decoder.layers.32.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.32.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.bias key (0.0, 0.03486784401000001, False, False)_get_param_groups name module.module.decoder.layers.22.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.bias lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.decoder.layers.33.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.16.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.bias lr_decay_rate 0.12157665459056935 _get_param_groups name module.module.decoder.layers.28.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.32.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.26.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.bias key (0.0, 0.08100000000000002, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.weight key (1.0, 0.04782969000000001, False, False) _get_param_groups name module.module.decoder.layers.27.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.weight lr_decay_rate 0.2824295364810001_get_param_groups name module.module.decoder.layers.29.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.32.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.33.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.16.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.bias key (0.0, 0.0729, False, False)_get_param_groups name module.module.decoder.layers.32.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.28.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.weight lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.decoder.layers.22.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.4.mlp.linear_fc2.bias key (0.0, 0.012157665459056936, False, False) name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.bias lr_decay_rate 0.4782969000000001_get_param_groups name module.module.decoder.layers.27.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.26.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.weight lr_decay_rate 0.81_get_param_groups name module.module.decoder.layers.29.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.28.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.weight key (1.0, 0.028242953648100012, False, False) _get_param_groups name module.module.decoder.layers.47.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.32.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.33.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.weight key (1.0, 0.03486784401000001, False, False)_get_param_groups name module.module.decoder.layers.33.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.ls1 lr_decay_rate 0.81name module.module.external_feature_model.vit.decoder.layers.5.ls1 lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.weight key (1.0, 0.08100000000000002, False, False)_get_param_groups name module.module.decoder.layers.28.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.16.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.22.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.bias key (0.0, 0.04782969000000001, False, False)_get_param_groups name module.module.decoder.layers.26.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.bias lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.decoder.final_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.33.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.33.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.ls1 key (0.0, 0.08100000000000002, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.ls1 key (0.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.bias lr_decay_rate 0.3486784401000001_get_param_groups name module.module.decoder.layers.16.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.22.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.29.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.33.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.bias lr_decay_rate 0.81 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.bias key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.decoder.layers.28.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.26.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.weight lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.decoder.layers.29.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.33.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.output_layer.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.33.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.16.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.bias key (0.0, 0.03486784401000001, False, False) name module.module.external_feature_model.vit.decoder.layers.22.ls2 lr_decay_rate 0.81 name module.module.external_feature_model.vit.decoder.layers.5.ls2 lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.bias key (0.0, 0.08100000000000002, False, False)_get_param_groups name module.module.decoder.layers.33.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.30.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.22.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.28.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.weight lr_decay_rate 0.2824295364810001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.weight key (1.0, 0.04782969000000001, False, False) _get_param_groups name module.module.decoder.layers.26.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.33.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.17.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.ls2 key (0.0, 0.013508517176729929, False, False) _get_param_groups name module.module.decoder.layers.33.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.weight lr_decay_rate 0.81 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.ls2 key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.33.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.28.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.weight lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.decoder.layers.30.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.22.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.weight key (1.0, 0.028242953648100012, False, False) _get_param_groups name module.module.decoder.layers.33.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.bias lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.decoder.layers.29.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.26.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.17.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.weight key (1.0, 0.08100000000000002, False, False)_get_param_groups name module.module.decoder.layers.33.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.weight lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.weight key (0.0, 0.03486784401000001, False, False)name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.weight lr_decay_rate 0.81_get_param_groups name module.module.decoder.layers.22.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.34.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.bias key (0.0, 0.04782969000000001, False, False)_get_param_groups name module.module.decoder.layers.30.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.bias lr_decay_rate 0.2824295364810001_get_param_groups name module.module.decoder.layers.28.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.26.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.33.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.weight key (0.0, 0.013508517176729929, False, False)_get_param_groups name module.module.decoder.layers.29.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.bias lr_decay_rate 0.81name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.bias lr_decay_rate 0.3486784401000001_get_param_groups name module.module.decoder.layers.17.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.weight key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.33.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.23.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.30.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.28.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.33.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.18.ls1 lr_decay_rate 0.531441_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.bias key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.decoder.layers.27.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.34.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.bias lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.bias key (0.0, 0.03486784401000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.bias key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.29.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.17.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.bias lr_decay_rate 0.81 _get_param_groups name module.module.decoder.layers.33.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.ls1 key (0.0, 0.05314410000000001, False, False) _get_param_groups name module.module.decoder.layers.28.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.23.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.34.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.30.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.input_layernorm.bias key (0.0, 0.013508517176729929, False, False)name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.weight lr_decay_rate 0.3486784401000001name module.module.external_feature_model.vit.decoder.layers.13.ls1 lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.decoder.layers.34.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.27.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.ls1 lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.29.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.18.ls2 lr_decay_rate 0.531441_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.bias key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.33.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.17.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.23.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.29.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.weight key (1.0, 0.03486784401000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.ls1 key (0.0, 0.031381059609000006, False, False)_get_param_groups name module.module.decoder.layers.34.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.ls2 key (0.0, 0.05314410000000001, False, False) _get_param_groups name module.module.decoder.layers.30.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.weight lr_decay_rate 0.13508517176729928_get_param_groups name module.module.decoder.layers.34.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.27.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.ls1 key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.30.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.23.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.34.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.17.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.weight lr_decay_rate 0.81 name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.bias lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.decoder.layers.29.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.13.ls2 lr_decay_rate 0.31381059609000006_get_param_groups name module.module.decoder.layers.34.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.23.ls2 lr_decay_rate 0.9_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.weight key (1.0, 0.013508517176729929, False, False)_get_param_groups name module.module.decoder.layers.27.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.34.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.30.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.weight lr_decay_rate 0.531441 _get_param_groups name module.module.decoder.layers.30.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.17.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.weight key (1.0, 0.08100000000000002, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.bias key (0.0, 0.03486784401000001, False, False) _get_param_groups name module.module.decoder.layers.23.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.34.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.29.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.ls2 key (0.0, 0.09000000000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.ls2 key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.decoder.layers.31.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.34.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.34.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.bias lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.weight key (0.0, 0.05314410000000001, False, False)_get_param_groups name module.module.decoder.layers.27.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.30.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.bias lr_decay_rate 0.81 _get_param_groups name module.module.decoder.layers.29.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.18.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.weight lr_decay_rate 0.3486784401000001_get_param_groups name module.module.decoder.layers.23.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.34.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.weight lr_decay_rate 0.31381059609000006_get_param_groups name module.module.decoder.layers.30.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.weight lr_decay_rate 0.9name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.bias lr_decay_rate 0.531441_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_proj.bias key (0.0, 0.013508517176729929, False, False)_get_param_groups name module.module.decoder.layers.34.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.bias key (0.0, 0.08100000000000002, False, False)_get_param_groups name module.module.decoder.layers.27.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.31.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.34.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.23.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.weight key (0.0, 0.031381059609000006, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.weight key (1.0, 0.03486784401000001, False, False) _get_param_groups name module.module.decoder.layers.18.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.weight key (0.0, 0.09000000000000001, False, False)_get_param_groups name module.module.decoder.layers.30.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.34.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.35.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.bias key (0.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.weight lr_decay_rate 0.13508517176729928_get_param_groups name module.module.decoder.layers.27.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.34.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.weight lr_decay_rate 0.81 _get_param_groups name module.module.decoder.layers.31.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.bias lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.decoder.layers.24.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.bias lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.decoder.layers.18.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.weight key (1.0, 0.013508517176729929, False, False)name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.bias lr_decay_rate 0.9_get_param_groups name module.module.decoder.layers.35.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.34.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.weight key (1.0, 0.08100000000000002, False, False)_get_param_groups name module.module.decoder.layers.31.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.bias key (0.0, 0.03486784401000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.bias key (0.0, 0.031381059609000006, False, False)_get_param_groups name module.module.decoder.layers.28.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.34.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.weight lr_decay_rate 0.531441 _get_param_groups name module.module.decoder.layers.29.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.18.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.24.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.bias key (0.0, 0.09000000000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.bias lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.decoder.layers.31.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.35.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.bias lr_decay_rate 0.81_get_param_groups name module.module.decoder.layers.34.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.weight key (1.0, 0.05314410000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.15.ls1 lr_decay_rate 0.3874204890000001name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.weight lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.decoder.layers.35.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.28.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.30.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.31.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.24.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.self_attention.linear_qkv.bias key (0.0, 0.013508517176729929, False, False)name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.weight lr_decay_rate 0.9_get_param_groups name module.module.decoder.layers.34.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.18.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.ls1 key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.decoder.layers.35.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.bias key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.weight key (1.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.bias lr_decay_rate 0.531441_get_param_groups name module.module.decoder.layers.35.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.30.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.24.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.28.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.31.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.weight key (1.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.35.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.bias lr_decay_rate 0.31381059609000006_get_param_groups name module.module.decoder.layers.18.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.weight lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.bias key (0.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.15.ls2 lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.decoder.layers.35.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.32.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.30.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.30.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.35.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.28.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.weight lr_decay_rate 0.81 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.bias key (0.0, 0.031381059609000006, False, False)name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.bias lr_decay_rate 0.9_get_param_groups name module.module.decoder.layers.24.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.35.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.weight key (0.0, 0.013508517176729929, False, False)_get_param_groups name module.module.decoder.layers.18.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.ls2 key (0.0, 0.03874204890000001, False, False)name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.weight lr_decay_rate 0.531441 _get_param_groups name module.module.decoder.layers.35.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.32.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.bias key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.30.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.30.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.28.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.35.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.weight key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.24.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.35.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.weight lr_decay_rate 0.31381059609000006name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.bias lr_decay_rate 0.13508517176729928_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.weight key (1.0, 0.05314410000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.weight lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.decoder.layers.32.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.19.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.35.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.weight lr_decay_rate 0.9_get_param_groups name module.module.decoder.layers.28.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.31.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.35.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.30.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.bias lr_decay_rate 0.81 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.weight key (1.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.bias lr_decay_rate 0.531441 _get_param_groups name module.module.decoder.layers.35.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.24.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.32.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.pre_mlp_layernorm.bias key (0.0, 0.013508517176729929, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.weight key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.decoder.layers.35.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.19.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.36.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.weight key (1.0, 0.09000000000000001, False, False)_get_param_groups name module.module.decoder.layers.28.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.31.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.bias key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.30.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.bias key (0.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.bias lr_decay_rate 0.3874204890000001name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.bias lr_decay_rate 0.31381059609000006 name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.weight lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.decoder.layers.32.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.25.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.35.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.35.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.36.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.29.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.31.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.19.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.bias lr_decay_rate 0.9 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.bias key (0.0, 0.03874204890000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.bias key (0.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.weight lr_decay_rate 0.81 _get_param_groups name module.module.decoder.layers.36.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.30.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.weight key (1.0, 0.013508517176729929, False, False) _get_param_groups name module.module.decoder.layers.32.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.25.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.weight lr_decay_rate 0.531441_get_param_groups name module.module.decoder.layers.31.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.bias key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.35.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.29.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.36.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.19.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.weight key (1.0, 0.08100000000000002, False, False)name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.weight lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.decoder.layers.31.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.32.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.25.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.weight lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.decoder.layers.36.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.bias lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.decoder.layers.36.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.weight key (0.0, 0.05314410000000001, False, False) _get_param_groups name module.module.decoder.layers.29.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.35.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.bias lr_decay_rate 0.81 _get_param_groups name module.module.decoder.layers.31.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.19.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.weight lr_decay_rate 0.9 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.weight key (0.0, 0.031381059609000006, False, False)_get_param_groups name module.module.decoder.layers.33.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.36.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.31.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.25.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc1.bias key (0.0, 0.013508517176729929, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.weight key (1.0, 0.03874204890000001, False, False)_get_param_groups name module.module.decoder.layers.36.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.bias lr_decay_rate 0.531441_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.bias key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.36.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.bias lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.decoder.layers.31.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.weight key (0.0, 0.09000000000000001, False, False)_get_param_groups name module.module.decoder.layers.36.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.19.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.31.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.33.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.weight lr_decay_rate 0.13508517176729928name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.weight lr_decay_rate 0.81 _get_param_groups name module.module.decoder.layers.36.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.25.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.bias key (0.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.bias lr_decay_rate 0.3874204890000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.bias key (0.0, 0.031381059609000006, False, False)_get_param_groups name module.module.decoder.layers.29.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.36.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.36.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.31.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.weight key (1.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.31.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.bias lr_decay_rate 0.9_get_param_groups name module.module.decoder.layers.19.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.33.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.36.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.weight key (1.0, 0.013508517176729929, False, False)_get_param_groups name module.module.decoder.layers.25.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.bias key (0.0, 0.03874204890000001, False, False) name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.weight lr_decay_rate 0.531441 _get_param_groups name module.module.decoder.layers.29.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.36.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.weight lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.decoder.layers.32.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.bias lr_decay_rate 0.81 _get_param_groups name module.module.decoder.layers.36.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.33.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.bias key (0.0, 0.09000000000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.bias lr_decay_rate 0.13508517176729928 _get_param_groups name module.module.decoder.layers.20.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.31.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.37.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.25.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.weight lr_decay_rate 0.3874204890000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.weight key (1.0, 0.05314410000000001, False, False) _get_param_groups name module.module.decoder.layers.29.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.36.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.36.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.32.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.weight key (1.0, 0.031381059609000006, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.bias key (0.0, 0.08100000000000002, False, False)_get_param_groups name module.module.decoder.layers.33.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.20.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.5.mlp.linear_fc2.bias key (0.0, 0.013508517176729929, False, False) name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.weight lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.31.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.weight key (1.0, 0.03874204890000001, False, False)_get_param_groups name module.module.decoder.layers.30.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.26.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.37.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.37.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.bias lr_decay_rate 0.531441 _get_param_groups name module.module.decoder.layers.32.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.36.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.bias lr_decay_rate 0.31381059609000006_get_param_groups name module.module.decoder.layers.20.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.23.ls1 lr_decay_rate 0.9 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.weight key (1.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.33.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.6.ls1 lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.decoder.layers.31.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.30.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.bias lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.bias key (0.0, 0.05314410000000001, False, False)_get_param_groups name module.module.decoder.layers.26.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.bias key (0.0, 0.031381059609000006, False, False)_get_param_groups name module.module.decoder.layers.20.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.37.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.32.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.bias key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.decoder.layers.37.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.ls1 key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.36.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.bias lr_decay_rate 0.9_get_param_groups name module.module.decoder.layers.33.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.ls1 key (0.0, 0.015009463529699918, False, False)_get_param_groups name module.module.decoder.layers.30.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.32.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.weight lr_decay_rate 0.531441_get_param_groups name module.module.decoder.layers.26.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.weight lr_decay_rate 0.31381059609000006_get_param_groups name module.module.decoder.layers.20.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.bias key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.37.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.weight lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.decoder.layers.36.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.weight key (1.0, 0.05314410000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.23.ls2 lr_decay_rate 0.9_get_param_groups name module.module.decoder.layers.30.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.32.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.26.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.34.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.6.ls2 lr_decay_rate 0.15009463529699918_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.weight key (1.0, 0.031381059609000006, False, False) _get_param_groups name module.module.decoder.layers.32.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.weight key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.decoder.layers.37.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.20.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.weight lr_decay_rate 0.9_get_param_groups name module.module.decoder.layers.37.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.ls2 key (0.0, 0.015009463529699918, False, False) _get_param_groups name module.module.decoder.layers.32.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.ls2 key (0.0, 0.09000000000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.bias lr_decay_rate 0.531441 _get_param_groups name module.module.decoder.layers.34.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.32.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.bias lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.decoder.layers.30.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.26.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.bias lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.decoder.layers.37.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.37.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.20.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.weight key (1.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.32.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.weight lr_decay_rate 0.9 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.bias key (0.0, 0.031381059609000006, False, False)_get_param_groups name module.module.decoder.layers.34.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.bias key (0.0, 0.05314410000000001, False, False)_get_param_groups name module.module.decoder.layers.32.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.weight lr_decay_rate 0.15009463529699918_get_param_groups name module.module.decoder.layers.26.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.30.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.bias key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.decoder.layers.37.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.33.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.21.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.38.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.34.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.weight key (0.0, 0.09000000000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.bias lr_decay_rate 0.9 name module.module.external_feature_model.vit.decoder.layers.19.ls1 lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.weight key (0.0, 0.015009463529699918, False, False)_get_param_groups name module.module.decoder.layers.37.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.26.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.14.ls1 lr_decay_rate 0.3486784401000001_get_param_groups name module.module.decoder.layers.32.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.30.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.weight lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.decoder.layers.33.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.bias key (0.0, 0.09000000000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.bias lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.21.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.38.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.34.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.bias lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.ls1 key (0.0, 0.05904900000000001, False, False)_get_param_groups name module.module.decoder.layers.32.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.ls1 key (0.0, 0.03486784401000001, False, False) _get_param_groups name module.module.decoder.layers.27.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.31.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.38.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.weight key (1.0, 0.03874204890000001, False, False)_get_param_groups name module.module.decoder.layers.33.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.bias key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.38.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.input_layernorm.bias key (0.0, 0.015009463529699918, False, False) _get_param_groups name module.module.decoder.layers.34.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vision_projection.encoder.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.21.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.19.ls2 lr_decay_rate 0.5904900000000001name module.module.external_feature_model.vit.decoder.layers.14.ls2 lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.decoder.layers.32.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.27.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.31.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.33.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.bias lr_decay_rate 0.3874204890000001 name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.weight lr_decay_rate 0.15009463529699918_get_param_groups name module.module.decoder.layers.38.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.34.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.38.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.weight lr_decay_rate 0.9_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.ls2 key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.external_feature_model.vision_projection.encoder.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.27.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.21.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.ls2 key (0.0, 0.03486784401000001, False, False) _get_param_groups name module.module.decoder.layers.33.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.33.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.bias key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.decoder.layers.31.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.38.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.weight key (1.0, 0.09000000000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.weight key (1.0, 0.015009463529699918, False, False) _get_param_groups name module.module.decoder.layers.35.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.27.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.38.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.weight lr_decay_rate 0.3486784401000001name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.weight lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.external_feature_model.pre_proj_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.38.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.31.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.21.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.33.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.weight lr_decay_rate 0.3874204890000001_get_param_groups name module.module.decoder.layers.38.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.33.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.38.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.bias lr_decay_rate 0.9 name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.bias lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.weight key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.weight key (0.0, 0.03486784401000001, False, False)_get_param_groups name module.module.decoder.layers.35.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.27.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.21.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.pre_proj_layernorm.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.bias key (0.0, 0.09000000000000001, False, False)_get_param_groups name module.module.decoder.layers.38.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.38.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.33.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.weight key (1.0, 0.03874204890000001, False, False)_get_param_groups name module.module.decoder.layers.31.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.33.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.38.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_proj.bias key (0.0, 0.015009463529699918, False, False) _get_param_groups name module.module.decoder.layers.21.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.bias lr_decay_rate 0.5904900000000001_get_param_groups name module.module.decoder.layers.27.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.bias lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.decoder.layers.35.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.embedding.word_embeddings.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.38.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.weight lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.38.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.34.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.33.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.bias lr_decay_rate 0.3874204890000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.bias key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.decoder.layers.31.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.weight lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.decoder.layers.39.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.bias key (0.0, 0.03486784401000001, False, False) _get_param_groups name module.module.decoder.layers.22.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.38.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.27.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.bias key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.decoder.layers.35.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.weight key (1.0, 0.09000000000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.weight key (1.0, 0.015009463529699918, False, False)_get_param_groups name module.module.decoder.layers.38.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.0.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.34.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.31.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.33.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.weight lr_decay_rate 0.5904900000000001_get_param_groups name module.module.decoder.layers.39.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.28.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.38.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.bias lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.22.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.16.ls1 lr_decay_rate 0.4304672100000001_get_param_groups name module.module.decoder.layers.39.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.bias lr_decay_rate 0.15009463529699918_get_param_groups name module.module.decoder.layers.34.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.35.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.weight lr_decay_rate 0.3486784401000001_get_param_groups name module.module.decoder.layers.32.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.33.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.39.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.0.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.weight key (1.0, 0.05904900000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.bias key (0.0, 0.09000000000000001, False, False)_get_param_groups name module.module.decoder.layers.28.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.38.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.ls1 key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.decoder.layers.34.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.32.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.weight key (1.0, 0.03486784401000001, False, False)_get_param_groups name module.module.decoder.layers.35.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.self_attention.linear_qkv.bias key (0.0, 0.015009463529699918, False, False)_get_param_groups name module.module.decoder.layers.22.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.33.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.bias lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.decoder.layers.39.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.39.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.28.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.0.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.weight lr_decay_rate 0.9 name module.module.external_feature_model.vit.decoder.layers.16.ls2 lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.decoder.layers.38.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.bias lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.decoder.layers.34.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.32.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.35.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.bias key (0.0, 0.05904900000000001, False, False)_get_param_groups name module.module.decoder.layers.22.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.28.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.39.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.bias key (0.0, 0.03486784401000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.ls2 key (0.0, 0.04304672100000001, False, False) _get_param_groups name module.module.decoder.layers.34.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.0.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.weight key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.32.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.weight lr_decay_rate 0.15009463529699918_get_param_groups name module.module.decoder.layers.39.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.34.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.36.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.39.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.39.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.weight lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.decoder.layers.22.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.weight lr_decay_rate 0.3486784401000001_get_param_groups name module.module.decoder.layers.28.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.weight lr_decay_rate 0.4304672100000001_get_param_groups name module.module.decoder.layers.34.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.weight key (0.0, 0.015009463529699918, False, False)name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.bias lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.39.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.34.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.32.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.39.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.0.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.weight key (1.0, 0.03486784401000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.weight key (1.0, 0.05904900000000001, False, False)_get_param_groups name module.module.decoder.layers.39.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.36.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.34.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.22.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.28.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.weight key (0.0, 0.04304672100000001, False, False) name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.bias lr_decay_rate 0.15009463529699918_get_param_groups name module.module.decoder.layers.39.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.34.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.bias key (0.0, 0.09000000000000001, False, False)_get_param_groups name module.module.decoder.layers.39.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.32.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.0.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.39.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.bias lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.bias lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.decoder.layers.36.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.35.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.39.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.28.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.pre_mlp_layernorm.bias key (0.0, 0.015009463529699918, False, False)_get_param_groups name module.module.decoder.layers.22.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.bias lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.decoder.layers.34.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.32.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.39.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.weight lr_decay_rate 0.9_get_param_groups name module.module.decoder.layers.0.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.36.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.bias key (0.0, 0.03486784401000001, False, False)_get_param_groups name module.module.decoder.layers.40.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.bias key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.bias key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.decoder.layers.29.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.39.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.35.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.23.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.weight key (1.0, 0.09000000000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.weight lr_decay_rate 0.15009463529699918 _get_param_groups name module.module.decoder.layers.34.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.1.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.40.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.33.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.36.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.weight lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.weight lr_decay_rate 0.5904900000000001 name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.bias lr_decay_rate 0.9_get_param_groups name module.module.decoder.layers.39.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.35.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.23.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.29.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.34.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.weight lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.weight key (1.0, 0.015009463529699918, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.weight key (0.0, 0.03486784401000001, False, False)_get_param_groups name module.module.decoder.layers.40.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.36.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.33.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.weight key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.decoder.layers.1.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.bias key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.39.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.23.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.35.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.35.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.weight key (1.0, 0.04304672100000001, False, False)name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.bias lr_decay_rate 0.15009463529699918_get_param_groups name module.module.decoder.layers.40.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.bias lr_decay_rate 0.5904900000000001name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.bias lr_decay_rate 0.3486784401000001_get_param_groups name module.module.decoder.layers.36.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.33.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.1.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.23.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.weight lr_decay_rate 0.9_get_param_groups name module.module.decoder.layers.40.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.35.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc1.bias key (0.0, 0.015009463529699918, False, False) _get_param_groups name module.module.decoder.layers.35.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.1.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.bias lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.decoder.layers.29.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.40.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.bias key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.bias key (0.0, 0.03486784401000001, False, False)_get_param_groups name module.module.decoder.layers.33.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.weight key (1.0, 0.09000000000000001, False, False)_get_param_groups name module.module.decoder.layers.37.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.35.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.23.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.bias key (0.0, 0.04304672100000001, False, False)name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.weight lr_decay_rate 0.15009463529699918_get_param_groups name module.module.decoder.layers.35.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.40.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.1.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.weight lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.decoder.layers.29.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.33.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.weight lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.bias lr_decay_rate 0.9_get_param_groups name module.module.decoder.layers.35.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.weight lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.decoder.layers.23.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.1.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.40.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.weight key (1.0, 0.015009463529699918, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.weight key (1.0, 0.05904900000000001, False, False)_get_param_groups name module.module.decoder.layers.35.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.bias key (0.0, 0.09000000000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.weight key (1.0, 0.03486784401000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.weight key (1.0, 0.04304672100000001, False, False)_get_param_groups name module.module.decoder.layers.40.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.33.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.35.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.40.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.bias lr_decay_rate 0.15009463529699918name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.bias lr_decay_rate 0.5904900000000001_get_param_groups name module.module.decoder.layers.36.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.23.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.bias lr_decay_rate 0.3486784401000001_get_param_groups name module.module.decoder.layers.1.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.33.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.41.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.bias lr_decay_rate 0.4304672100000001_get_param_groups name module.module.decoder.layers.37.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vision_projection.encoder.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.35.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.6.mlp.linear_fc2.bias key (0.0, 0.015009463529699918, False, False)_get_param_groups name module.module.decoder.layers.40.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.bias key (0.0, 0.03486784401000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.bias key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.decoder.layers.36.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.bias key (0.0, 0.04304672100000001, False, False) _get_param_groups name module.module.decoder.layers.24.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.2.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.34.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.41.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.30.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.41.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.7.ls1 lr_decay_rate 0.16677181699666577_get_param_groups name module.module.external_feature_model.vision_projection.encoder.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.35.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.36.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.weight lr_decay_rate 0.5904900000000001name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.weight lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.decoder.layers.30.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.37.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.weight lr_decay_rate 0.4304672100000001_get_param_groups name module.module.decoder.layers.41.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.ls1 key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.decoder.layers.24.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.41.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.34.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.2.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.36.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.weight key (1.0, 0.03486784401000001, False, False) _get_param_groups name module.module.decoder.layers.40.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.pre_proj_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.36.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.weight key (1.0, 0.05904900000000001, False, False) _get_param_groups name module.module.decoder.layers.30.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.41.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.7.ls2 lr_decay_rate 0.16677181699666577_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.weight key (0.0, 0.04304672100000001, False, False) _get_param_groups name module.module.decoder.layers.37.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.pre_proj_layernorm.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.24.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.41.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.41.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.34.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.2.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.30.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.bias lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.decoder.layers.41.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.bias lr_decay_rate 0.5904900000000001_get_param_groups name module.module.decoder.layers.36.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.bias lr_decay_rate 0.4304672100000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.ls2 key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.decoder.layers.36.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.38.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.embedding.word_embeddings.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.41.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.24.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.bias key (0.0, 0.03486784401000001, False, False)_get_param_groups name module.module.decoder.layers.2.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.34.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.bias key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.decoder.layers.36.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.weight lr_decay_rate 0.16677181699666577_get_param_groups name module.module.decoder.layers.41.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.bias key (0.0, 0.04304672100000001, False, False) _get_param_groups name module.module.decoder.layers.41.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.38.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.30.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.41.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.36.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.15.ls1 lr_decay_rate 0.3874204890000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.weight key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.decoder.layers.24.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.36.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.0.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.2.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.30.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.41.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.38.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.41.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.20.ls1 lr_decay_rate 0.6561 _get_param_groups name module.module.decoder.layers.34.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.weight lr_decay_rate 0.4304672100000001_get_param_groups name module.module.decoder.layers.41.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.36.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.ls1 key (0.0, 0.03874204890000001, False, False)name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.bias lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.decoder.layers.24.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.41.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.ls1 key (0.0, 0.06561, False, False)_get_param_groups name module.module.decoder.layers.0.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.34.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.2.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.30.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.38.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.41.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.weight key (1.0, 0.04304672100000001, False, False) _get_param_groups name module.module.decoder.layers.42.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.input_layernorm.bias key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.decoder.layers.24.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.15.ls2 lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.decoder.layers.36.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.0.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.31.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.34.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.20.ls2 lr_decay_rate 0.6561 _get_param_groups name module.module.decoder.layers.41.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.2.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.38.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.ls2 key (0.0, 0.03874204890000001, False, False)name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.weight lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.bias lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.decoder.layers.42.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.25.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.36.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.0.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.ls2 key (0.0, 0.06561, False, False)_get_param_groups name module.module.decoder.layers.37.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.35.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.31.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.weight key (1.0, 0.016677181699666577, False, False)_get_param_groups name module.module.decoder.layers.42.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.41.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.3.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.bias key (0.0, 0.04304672100000001, False, False)name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.weight lr_decay_rate 0.6561_get_param_groups name module.module.decoder.layers.38.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.weight lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.decoder.layers.37.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.36.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.42.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.0.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.31.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.25.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.42.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.bias lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.decoder.layers.41.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.35.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.weight key (0.0, 0.06561, False, False) name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.weight lr_decay_rate 0.4304672100000001_get_param_groups name module.module.decoder.layers.38.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.weight key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.decoder.layers.3.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.42.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.31.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.37.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.0.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_proj.bias key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.decoder.layers.25.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.weight key (1.0, 0.04304672100000001, False, False)_get_param_groups name module.module.decoder.layers.42.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.39.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.35.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.bias lr_decay_rate 0.6561_get_param_groups name module.module.decoder.layers.42.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.bias lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.decoder.layers.3.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.42.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.42.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.31.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.0.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.weight lr_decay_rate 0.16677181699666577_get_param_groups name module.module.decoder.layers.35.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.bias key (0.0, 0.06561, False, False) _get_param_groups name module.module.decoder.layers.25.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.39.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.bias lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.decoder.layers.3.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.bias key (0.0, 0.03874204890000001, False, False)_get_param_groups name module.module.decoder.layers.42.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.42.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.37.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.42.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.35.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.31.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.3.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.weight key (1.0, 0.016677181699666577, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.bias key (0.0, 0.04304672100000001, False, False) _get_param_groups name module.module.decoder.layers.25.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.1.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.39.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.weight lr_decay_rate 0.6561 _get_param_groups name module.module.decoder.layers.42.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.37.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.38.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.weight lr_decay_rate 0.3874204890000001_get_param_groups name module.module.decoder.layers.31.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.35.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.3.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.17.ls1 lr_decay_rate 0.4782969000000001name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.bias lr_decay_rate 0.16677181699666577_get_param_groups name module.module.decoder.layers.25.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.42.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.1.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.39.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.weight key (1.0, 0.06561, False, False) _get_param_groups name module.module.decoder.layers.38.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.self_attention.linear_qkv.bias key (0.0, 0.016677181699666577, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.weight key (1.0, 0.03874204890000001, False, False)_get_param_groups name module.module.decoder.layers.43.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.43.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.35.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.32.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.37.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.ls1 key (0.0, 0.04782969000000001, False, False)_get_param_groups name module.module.decoder.layers.3.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.bias lr_decay_rate 0.6561 _get_param_groups name module.module.decoder.layers.1.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.25.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.42.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.39.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.bias key (0.0, 0.06561, False, False)_get_param_groups name module.module.decoder.layers.38.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.17.ls2 lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.decoder.layers.43.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.36.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.32.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.weight lr_decay_rate 0.16677181699666577name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.bias lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.decoder.layers.1.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.37.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.4.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.38.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.39.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.42.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.ls2 key (0.0, 0.04782969000000001, False, False)_get_param_groups name module.module.decoder.layers.43.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.36.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.26.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.weight lr_decay_rate 0.6561 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.bias key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.decoder.layers.43.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.32.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.weight key (0.0, 0.016677181699666577, False, False) name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.weight lr_decay_rate 0.4782969000000001_get_param_groups name module.module.decoder.layers.37.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.1.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.weight key (1.0, 0.06561, False, False) _get_param_groups name module.module.decoder.layers.39.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.42.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.26.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.36.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.38.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.4.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.32.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.43.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.bias lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.weight lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.decoder.layers.38.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.weight key (0.0, 0.04782969000000001, False, False)_get_param_groups name module.module.decoder.layers.43.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.36.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.bias lr_decay_rate 0.6561_get_param_groups name module.module.decoder.layers.40.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.1.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.26.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.38.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.4.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.pre_mlp_layernorm.bias key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.decoder.layers.43.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.weight key (1.0, 0.03874204890000001, False, False)_get_param_groups name module.module.decoder.layers.32.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.38.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.bias key (0.0, 0.06561, False, False)_get_param_groups name module.module.decoder.layers.40.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.1.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.bias lr_decay_rate 0.4782969000000001_get_param_groups name module.module.decoder.layers.38.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.4.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.26.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.36.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.weight lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.decoder.layers.32.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.bias lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.decoder.layers.39.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.40.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.38.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.bias key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.decoder.layers.36.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.2.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.weight key (1.0, 0.016677181699666577, False, False)name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.weight lr_decay_rate 0.6561 _get_param_groups name module.module.decoder.layers.4.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.43.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.bias key (0.0, 0.03874204890000001, False, False)_get_param_groups name module.module.decoder.layers.32.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.26.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.36.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.39.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.38.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.bias lr_decay_rate 0.16677181699666577 name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.weight lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.decoder.layers.2.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.weight key (0.0, 0.06561, False, False)_get_param_groups name module.module.decoder.layers.33.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.4.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.26.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.weight lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.decoder.layers.39.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.37.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.43.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.weight key (1.0, 0.04782969000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc1.bias key (0.0, 0.016677181699666577, False, False)_get_param_groups name module.module.decoder.layers.44.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.4.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.38.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.2.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.33.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.bias lr_decay_rate 0.6561 _get_param_groups name module.module.decoder.layers.26.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.39.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.weight key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.decoder.layers.44.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.37.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.bias lr_decay_rate 0.4782969000000001 name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.weight lr_decay_rate 0.16677181699666577_get_param_groups name module.module.decoder.layers.2.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.43.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.27.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.bias key (0.0, 0.06561, False, False) _get_param_groups name module.module.decoder.layers.5.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.33.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.38.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.bias lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.decoder.layers.44.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.37.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.39.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.bias key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.decoder.layers.43.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.weight key (1.0, 0.016677181699666577, False, False) _get_param_groups name module.module.decoder.layers.40.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.33.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.27.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.2.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.39.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.bias key (0.0, 0.03874204890000001, False, False)name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.weight lr_decay_rate 0.6561_get_param_groups name module.module.decoder.layers.5.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.38.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.bias lr_decay_rate 0.16677181699666577 _get_param_groups name module.module.decoder.layers.44.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.41.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.weight lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.decoder.layers.44.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.2.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.weight key (1.0, 0.06561, False, False)_get_param_groups name module.module.decoder.layers.33.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.39.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.27.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.5.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.weight lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.decoder.layers.39.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.37.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.7.mlp.linear_fc2.bias key (0.0, 0.016677181699666577, False, False) _get_param_groups name module.module.decoder.layers.44.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.41.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.weight key (1.0, 0.04782969000000001, False, False) _get_param_groups name module.module.decoder.layers.27.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.2.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.bias lr_decay_rate 0.6561 _get_param_groups name module.module.decoder.layers.33.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.44.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.8.ls1 lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.decoder.layers.5.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.weight key (1.0, 0.03874204890000001, False, False)_get_param_groups name module.module.decoder.layers.44.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.39.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.41.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.33.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.bias lr_decay_rate 0.4782969000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.bias key (0.0, 0.06561, False, False)_get_param_groups name module.module.decoder.layers.27.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.3.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.40.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.ls1 key (0.0, 0.018530201888518418, False, False)name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.bias lr_decay_rate 0.3874204890000001_get_param_groups name module.module.decoder.layers.44.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.5.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.41.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.45.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.39.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.34.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.weight lr_decay_rate 0.6561 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.bias key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.bias key (0.0, 0.03874204890000001, False, False) name module.module.external_feature_model.vit.decoder.layers.8.ls2 lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.decoder.layers.40.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.27.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.44.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.5.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.38.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.39.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.3.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.weight key (1.0, 0.06561, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.ls2 key (0.0, 0.018530201888518418, False, False)_get_param_groups name module.module.decoder.layers.41.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.45.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.45.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.34.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.weight lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.decoder.layers.27.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.5.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.weight lr_decay_rate 0.4782969000000001_get_param_groups name module.module.decoder.layers.44.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.bias lr_decay_rate 0.6561 _get_param_groups name module.module.decoder.layers.38.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.41.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.weight lr_decay_rate 0.18530201888518416_get_param_groups name module.module.decoder.layers.3.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.39.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.45.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.34.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.weight key (1.0, 0.03874204890000001, False, False)_get_param_groups name module.module.decoder.layers.45.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.28.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.weight key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.decoder.layers.40.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.44.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.bias key (0.0, 0.06561, False, False)_get_param_groups name module.module.decoder.layers.6.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.weight key (0.0, 0.018530201888518418, False, False) _get_param_groups name module.module.decoder.layers.38.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.45.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.41.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.3.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.bias lr_decay_rate 0.3874204890000001 name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.bias lr_decay_rate 0.4782969000000001_get_param_groups name module.module.decoder.layers.39.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.34.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.45.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.40.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.28.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.45.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.38.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.bias lr_decay_rate 0.18530201888518416_get_param_groups name module.module.decoder.layers.39.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.3.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.21.ls1 lr_decay_rate 0.7290000000000001_get_param_groups name module.module.decoder.layers.6.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.45.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.bias key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.bias key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.decoder.layers.28.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.40.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.34.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.45.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.input_layernorm.bias key (0.0, 0.018530201888518418, False, False) _get_param_groups name module.module.decoder.layers.45.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.ls1 key (0.0, 0.0729, False, False) _get_param_groups name module.module.decoder.layers.3.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.6.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.45.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.38.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.40.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.28.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.weight lr_decay_rate 0.4782969000000001_get_param_groups name module.module.decoder.layers.34.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.6.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.41.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.16.ls1 lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.decoder.layers.45.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.21.ls2 lr_decay_rate 0.7290000000000001_get_param_groups name module.module.decoder.layers.3.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.45.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.weight lr_decay_rate 0.18530201888518416_get_param_groups name module.module.decoder.layers.38.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.45.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.34.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.weight key (1.0, 0.04782969000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.ls1 key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.decoder.layers.40.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.28.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.41.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.4.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.ls2 key (0.0, 0.0729, False, False)_get_param_groups name module.module.decoder.layers.6.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.46.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.45.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.45.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.42.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.weight key (1.0, 0.018530201888518418, False, False) name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.bias lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.decoder.layers.38.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.35.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.28.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.16.ls2 lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.decoder.layers.40.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.41.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.weight lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.decoder.layers.45.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.46.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.42.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.46.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.6.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.4.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.bias key (0.0, 0.04782969000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.bias lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.decoder.layers.39.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.28.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.35.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.40.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.ls2 key (0.0, 0.04304672100000001, False, False) _get_param_groups name module.module.decoder.layers.46.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.weight key (0.0, 0.0729, False, False) _get_param_groups name module.module.decoder.layers.41.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.6.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.46.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_proj.bias key (0.0, 0.018530201888518418, False, False)_get_param_groups name module.module.decoder.layers.35.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.4.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.45.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.weight lr_decay_rate 0.4782969000000001_get_param_groups name module.module.decoder.layers.46.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.39.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.weight lr_decay_rate 0.4304672100000001_get_param_groups name module.module.decoder.layers.42.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.bias lr_decay_rate 0.7290000000000001_get_param_groups name module.module.decoder.layers.41.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.40.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.7.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.35.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.4.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.46.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.weight lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.weight key (1.0, 0.04782969000000001, False, False)_get_param_groups name module.module.decoder.layers.45.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.41.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.46.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.29.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.bias key (0.0, 0.0729, False, False) _get_param_groups name module.module.decoder.layers.39.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.weight key (0.0, 0.04304672100000001, False, False) _get_param_groups name module.module.decoder.layers.40.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.45.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.weight key (1.0, 0.018530201888518418, False, False)_get_param_groups name module.module.decoder.layers.46.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.bias lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.decoder.layers.7.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.35.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.4.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.46.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.41.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.39.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.bias lr_decay_rate 0.4304672100000001name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.weight lr_decay_rate 0.7290000000000001_get_param_groups name module.module.decoder.layers.43.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.bias key (0.0, 0.04782969000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.bias lr_decay_rate 0.18530201888518416_get_param_groups name module.module.decoder.layers.46.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.46.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.46.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.41.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.7.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.35.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.4.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.bias key (0.0, 0.04304672100000001, False, False) _get_param_groups name module.module.decoder.layers.39.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.weight key (1.0, 0.0729, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.self_attention.linear_qkv.bias key (0.0, 0.018530201888518418, False, False) _get_param_groups name module.module.decoder.layers.46.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.18.ls1 lr_decay_rate 0.531441 _get_param_groups name module.module.decoder.layers.46.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.7.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.35.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.4.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.41.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.39.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.42.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.47.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.bias lr_decay_rate 0.7290000000000001_get_param_groups name module.module.decoder.layers.46.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.weight lr_decay_rate 0.18530201888518416_get_param_groups name module.module.decoder.layers.46.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.ls1 key (0.0, 0.05314410000000001, False, False)_get_param_groups name module.module.decoder.layers.29.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.weight lr_decay_rate 0.4304672100000001_get_param_groups name module.module.decoder.layers.36.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.7.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.5.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.41.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.43.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.39.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.bias key (0.0, 0.0729, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.weight key (1.0, 0.04304672100000001, False, False) _get_param_groups name module.module.decoder.layers.46.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.7.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.47.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.18.ls2 lr_decay_rate 0.531441_get_param_groups name module.module.decoder.layers.29.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.weight key (0.0, 0.018530201888518418, False, False) _get_param_groups name module.module.decoder.layers.36.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.weight lr_decay_rate 0.7290000000000001_get_param_groups name module.module.decoder.layers.41.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.5.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.bias lr_decay_rate 0.4304672100000001 name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.bias lr_decay_rate 0.18530201888518416_get_param_groups name module.module.decoder.layers.40.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.ls2 key (0.0, 0.05314410000000001, False, False) _get_param_groups name module.module.decoder.layers.47.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.7.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.5.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.46.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.30.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.36.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.bias key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.weight key (1.0, 0.0729, False, False)_get_param_groups name module.module.decoder.layers.42.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.47.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.weight lr_decay_rate 0.531441_get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.pre_mlp_layernorm.bias key (0.0, 0.018530201888518418, False, False)_get_param_groups name module.module.decoder.layers.40.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.8.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.5.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.36.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.41.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.46.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.bias lr_decay_rate 0.7290000000000001_get_param_groups name module.module.decoder.layers.30.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.47.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.weight lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.decoder.layers.47.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.42.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.weight key (0.0, 0.05314410000000001, False, False)_get_param_groups name module.module.decoder.layers.40.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.weight lr_decay_rate 0.18530201888518416_get_param_groups name module.module.decoder.layers.8.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.bias key (0.0, 0.0729, False, False) _get_param_groups name module.module.decoder.layers.30.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.41.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.46.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.weight key (1.0, 0.04304672100000001, False, False) _get_param_groups name module.module.decoder.layers.36.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.5.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.47.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.40.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.42.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.bias lr_decay_rate 0.531441 _get_param_groups name module.module.decoder.layers.8.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.30.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.weight key (1.0, 0.018530201888518418, False, False) _get_param_groups name module.module.decoder.layers.36.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.41.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.bias key (0.0, 0.05314410000000001, False, False) _get_param_groups name module.module.decoder.layers.44.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.weight lr_decay_rate 0.7290000000000001name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.bias lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.decoder.layers.47.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.5.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.47.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.8.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.36.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.40.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.bias lr_decay_rate 0.18530201888518416_get_param_groups name module.module.decoder.layers.30.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.final_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.42.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.44.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.weight lr_decay_rate 0.531441 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.weight key (0.0, 0.0729, False, False)_get_param_groups name module.module.decoder.layers.47.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.bias key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.decoder.layers.5.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.8.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc1.bias key (0.0, 0.018530201888518418, False, False)_get_param_groups name module.module.decoder.layers.43.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.30.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.bias lr_decay_rate 0.7290000000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.weight key (1.0, 0.05314410000000001, False, False) _get_param_groups name module.module.decoder.layers.44.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.output_layer.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.42.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.6.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.8.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.weight lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.decoder.layers.43.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.40.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.weight lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.decoder.layers.47.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.bias key (0.0, 0.0729, False, False)_get_param_groups name module.module.decoder.layers.30.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.final_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.bias lr_decay_rate 0.531441 _get_param_groups name module.module.decoder.layers.8.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.weight key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.decoder.layers.6.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.42.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.weight key (1.0, 0.018530201888518418, False, False)_get_param_groups name module.module.decoder.layers.47.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.41.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.bias key (0.0, 0.05314410000000001, False, False)_get_param_groups name module.module.decoder.layers.31.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.9.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.weight lr_decay_rate 0.7290000000000001_get_param_groups name module.module.output_layer.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.6.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.bias lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.decoder.layers.37.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.43.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.bias lr_decay_rate 0.18530201888518416 _get_param_groups name module.module.decoder.layers.45.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.47.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.9.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.weight lr_decay_rate 0.531441 _get_param_groups name module.module.decoder.layers.41.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.bias key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.weight key (1.0, 0.0729, False, False)_get_param_groups name module.module.decoder.layers.6.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.31.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.8.mlp.linear_fc2.bias key (0.0, 0.018530201888518418, False, False)_get_param_groups name module.module.decoder.layers.37.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.42.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.9.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.weight key (1.0, 0.05314410000000001, False, False) _get_param_groups name module.module.decoder.layers.47.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.45.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.bias lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.decoder.layers.41.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.6.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.31.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.weight lr_decay_rate 0.4304672100000001_get_param_groups name module.module.decoder.layers.9.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.42.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.37.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.9.ls1 lr_decay_rate 0.20589113209464907name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.bias lr_decay_rate 0.531441 _get_param_groups name module.module.decoder.layers.47.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.bias key (0.0, 0.0729, False, False) _get_param_groups name module.module.decoder.layers.45.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.41.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.6.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.bias key (0.0, 0.05314410000000001, False, False) _get_param_groups name module.module.decoder.layers.31.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.ls1 key (0.0, 0.02058911320946491, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.weight key (1.0, 0.04304672100000001, False, False) _get_param_groups name module.module.decoder.final_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.42.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.9.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.37.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.weight lr_decay_rate 0.7290000000000001_get_param_groups name module.module.decoder.layers.45.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.44.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.6.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.9.ls2 lr_decay_rate 0.20589113209464907name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.bias lr_decay_rate 0.4304672100000001_get_param_groups name module.module.decoder.layers.41.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.weight lr_decay_rate 0.531441 _get_param_groups name module.module.decoder.layers.31.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.43.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.output_layer.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.weight key (1.0, 0.0729, False, False)_get_param_groups name module.module.decoder.layers.9.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.38.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.ls2 key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.decoder.layers.45.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.7.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.weight key (0.0, 0.05314410000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.bias key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.decoder.layers.41.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.31.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.bias lr_decay_rate 0.7290000000000001_get_param_groups name module.module.decoder.layers.9.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.45.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.38.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.7.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.weight lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.decoder.layers.44.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.bias lr_decay_rate 0.531441 name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.weight lr_decay_rate 0.4304672100000001_get_param_groups name module.module.decoder.layers.41.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.31.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.bias key (0.0, 0.0729, False, False) _get_param_groups name module.module.decoder.layers.43.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.45.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.bias key (0.0, 0.05314410000000001, False, False)_get_param_groups name module.module.decoder.layers.38.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.10.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.weight key (0.0, 0.02058911320946491, False, False)_get_param_groups name module.module.decoder.layers.7.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.44.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.weight key (1.0, 0.04304672100000001, False, False) _get_param_groups name module.module.decoder.layers.42.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.32.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.ls1 lr_decay_rate 0.81 _get_param_groups name module.module.decoder.layers.43.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.46.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.38.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.7.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.bias lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.weight lr_decay_rate 0.531441 name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.bias lr_decay_rate 0.4304672100000001_get_param_groups name module.module.decoder.layers.10.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.ls1 key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.32.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.46.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.input_layernorm.bias key (0.0, 0.02058911320946491, False, False)_get_param_groups name module.module.decoder.layers.44.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.bias key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.decoder.layers.38.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.weight key (1.0, 0.05314410000000001, False, False)_get_param_groups name module.module.decoder.layers.42.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.10.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.7.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.ls2 lr_decay_rate 0.81 _get_param_groups name module.module.decoder.layers.32.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.46.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.38.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.weight lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.decoder.layers.10.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.bias lr_decay_rate 0.531441 _get_param_groups name module.module.decoder.layers.43.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.ls2 key (0.0, 0.08100000000000002, False, False)_get_param_groups name module.module.decoder.layers.7.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.17.ls1 lr_decay_rate 0.4782969000000001_get_param_groups name module.module.decoder.layers.32.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.45.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.weight key (1.0, 0.02058911320946491, False, False) _get_param_groups name module.module.decoder.layers.46.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.38.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.bias key (0.0, 0.05314410000000001, False, False) _get_param_groups name module.module.decoder.layers.10.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.43.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.42.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.weight lr_decay_rate 0.81_get_param_groups name module.module.decoder.layers.7.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.ls1 key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.decoder.layers.45.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.bias lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.decoder.layers.32.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.39.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.weight lr_decay_rate 0.531441 _get_param_groups name module.module.decoder.layers.46.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.42.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.10.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.weight key (0.0, 0.08100000000000002, False, False) name module.module.external_feature_model.vit.decoder.layers.17.ls2 lr_decay_rate 0.4782969000000001_get_param_groups name module.module.decoder.layers.44.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_proj.bias key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.decoder.layers.8.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.45.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.weight key (1.0, 0.05314410000000001, False, False)_get_param_groups name module.module.decoder.layers.32.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.39.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.46.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.ls2 key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.decoder.layers.45.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.10.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.8.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.bias lr_decay_rate 0.81name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.weight lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.bias lr_decay_rate 0.531441_get_param_groups name module.module.decoder.layers.32.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.44.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.46.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.39.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.8.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.weight lr_decay_rate 0.4782969000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.bias key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.11.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.weight key (1.0, 0.02058911320946491, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.bias key (0.0, 0.05314410000000001, False, False)_get_param_groups name module.module.decoder.layers.45.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.33.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.39.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.44.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.8.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.weight key (0.0, 0.04782969000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.bias lr_decay_rate 0.20589113209464907_get_param_groups name module.module.decoder.layers.45.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.11.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.weight lr_decay_rate 0.81name module.module.external_feature_model.vit.decoder.layers.19.ls1 lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.decoder.layers.47.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.33.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.43.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.bias lr_decay_rate 0.4782969000000001_get_param_groups name module.module.decoder.layers.39.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.self_attention.linear_qkv.bias key (0.0, 0.02058911320946491, False, False)_get_param_groups name module.module.decoder.layers.11.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.ls1 key (0.0, 0.05904900000000001, False, False)_get_param_groups name module.module.decoder.layers.45.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.8.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.weight key (1.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.47.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.43.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.33.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.44.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.11.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.bias key (0.0, 0.04782969000000001, False, False)_get_param_groups name module.module.decoder.layers.39.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.19.ls2 lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.decoder.layers.8.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.46.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.weight lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.decoder.layers.33.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.bias lr_decay_rate 0.81 _get_param_groups name module.module.decoder.layers.44.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.ls2 key (0.0, 0.05904900000000001, False, False)_get_param_groups name module.module.decoder.layers.39.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.8.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.11.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.weight key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.decoder.layers.47.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.weight lr_decay_rate 0.4782969000000001_get_param_groups name module.module.decoder.layers.46.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.bias key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.33.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.44.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.9.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.weight lr_decay_rate 0.5904900000000001_get_param_groups name module.module.decoder.layers.11.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.bias lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.decoder.layers.47.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.weight key (1.0, 0.04782969000000001, False, False) _get_param_groups name module.module.decoder.layers.46.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.weight lr_decay_rate 0.81 _get_param_groups name module.module.decoder.layers.33.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.weight key (0.0, 0.05904900000000001, False, False)_get_param_groups name module.module.decoder.layers.45.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.43.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.pre_mlp_layernorm.bias key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.decoder.layers.11.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.weight key (1.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.47.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.9.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.46.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.bias lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.decoder.layers.33.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.bias lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.decoder.layers.40.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.45.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.bias key (0.0, 0.04782969000000001, False, False)_get_param_groups name module.module.decoder.layers.47.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.bias lr_decay_rate 0.81 _get_param_groups name module.module.decoder.layers.12.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.weight lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.decoder.layers.9.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.bias key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.decoder.layers.46.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.34.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.45.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.bias key (0.0, 0.08100000000000002, False, False)_get_param_groups name module.module.decoder.final_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.weight lr_decay_rate 0.4782969000000001_get_param_groups name module.module.decoder.layers.9.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.weight key (1.0, 0.02058911320946491, False, False) _get_param_groups name module.module.decoder.layers.46.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.12.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.45.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.weight lr_decay_rate 0.5904900000000001_get_param_groups name module.module.decoder.layers.34.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.weight key (1.0, 0.04782969000000001, False, False)_get_param_groups name module.module.decoder.layers.40.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.46.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.output_layer.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.bias lr_decay_rate 0.20589113209464907 name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.weight lr_decay_rate 0.81_get_param_groups name module.module.decoder.layers.9.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.12.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.45.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.weight key (1.0, 0.05904900000000001, False, False) _get_param_groups name module.module.decoder.layers.44.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.34.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.bias lr_decay_rate 0.4782969000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc1.bias key (0.0, 0.02058911320946491, False, False) _get_param_groups name module.module.decoder.layers.12.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.weight key (0.0, 0.08100000000000002, False, False)_get_param_groups name module.module.decoder.layers.40.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.bias lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.decoder.layers.9.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.45.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.34.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.bias key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.decoder.layers.40.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.bias key (0.0, 0.05904900000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.weight lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.decoder.layers.12.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.9.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.bias lr_decay_rate 0.81_get_param_groups name module.module.decoder.layers.45.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.44.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.34.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.weight key (1.0, 0.02058911320946491, False, False)_get_param_groups name module.module.decoder.layers.41.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.weight lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.bias key (0.0, 0.08100000000000002, False, False)_get_param_groups name module.module.decoder.layers.10.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.12.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.weight lr_decay_rate 0.4782969000000001_get_param_groups name module.module.decoder.layers.46.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.bias lr_decay_rate 0.20589113209464907 _get_param_groups name module.module.decoder.layers.34.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.44.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.weight key (1.0, 0.05904900000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.weight lr_decay_rate 0.81 _get_param_groups name module.module.decoder.layers.41.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.12.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.47.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.weight key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.decoder.layers.10.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.9.mlp.linear_fc2.bias key (0.0, 0.02058911320946491, False, False)_get_param_groups name module.module.decoder.layers.46.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.weight key (1.0, 0.08100000000000002, False, False)name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.bias lr_decay_rate 0.5904900000000001_get_param_groups name module.module.decoder.layers.34.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.45.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.41.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.13.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.bias lr_decay_rate 0.4782969000000001_get_param_groups name module.module.decoder.layers.10.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.47.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.46.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.bias key (0.0, 0.05904900000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.10.ls1 lr_decay_rate 0.2287679245496101 name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.bias lr_decay_rate 0.81 _get_param_groups name module.module.decoder.layers.41.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.35.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.bias key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.decoder.layers.10.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.13.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.45.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.46.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.bias key (0.0, 0.08100000000000002, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.ls1 key (0.0, 0.02287679245496101, False, False) name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.weight lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.decoder.layers.41.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.13.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.35.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.weight lr_decay_rate 0.4782969000000001_get_param_groups name module.module.decoder.layers.45.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.10.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.weight lr_decay_rate 0.81 name module.module.external_feature_model.vit.decoder.layers.10.ls2 lr_decay_rate 0.2287679245496101_get_param_groups name module.module.decoder.layers.46.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.weight key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.decoder.layers.41.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.13.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.weight key (1.0, 0.04782969000000001, False, False)_get_param_groups name module.module.decoder.layers.45.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.35.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.10.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.ls2 key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.weight key (1.0, 0.08100000000000002, False, False) name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.bias lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.decoder.layers.46.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.final_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.41.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.13.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.bias lr_decay_rate 0.4782969000000001_get_param_groups name module.module.decoder.layers.35.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.45.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.weight lr_decay_rate 0.2287679245496101_get_param_groups name module.module.decoder.layers.10.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.bias lr_decay_rate 0.81_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.bias key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.decoder.layers.46.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.output_layer.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.bias key (0.0, 0.04782969000000001, False, False)_get_param_groups name module.module.decoder.layers.13.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.bias key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.45.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.11.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.35.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.weight key (0.0, 0.02287679245496101, False, False)name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.weight lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.decoder.layers.13.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.weight lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.decoder.layers.42.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.45.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.weight key (1.0, 0.05904900000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.bias lr_decay_rate 0.2287679245496101_get_param_groups name module.module.decoder.layers.35.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.23.ls1 lr_decay_rate 0.9_get_param_groups name module.module.decoder.layers.11.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.14.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.weight key (1.0, 0.04782969000000001, False, False)_get_param_groups name module.module.decoder.layers.42.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.bias lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.decoder.layers.46.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.input_layernorm.bias key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.decoder.layers.35.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.11.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.ls1 key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.42.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.bias key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.decoder.layers.14.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.bias lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.decoder.layers.11.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.46.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.ls2 lr_decay_rate 0.9_get_param_groups name module.module.decoder.layers.36.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.weight lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.decoder.layers.47.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.42.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.14.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.bias key (0.0, 0.04782969000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.weight lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.decoder.layers.46.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.ls2 key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.weight key (1.0, 0.02287679245496101, False, False)_get_param_groups name module.module.decoder.layers.11.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.36.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.14.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.weight key (1.0, 0.05904900000000001, False, False)_get_param_groups name module.module.decoder.layers.46.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.18.ls1 lr_decay_rate 0.531441name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.bias lr_decay_rate 0.2287679245496101 name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.weight lr_decay_rate 0.9_get_param_groups name module.module.decoder.layers.11.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.36.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.47.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.bias lr_decay_rate 0.5904900000000001_get_param_groups name module.module.decoder.layers.14.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.46.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_proj.bias key (0.0, 0.02287679245496101, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.ls1 key (0.0, 0.05314410000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.weight key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.11.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.bias key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.decoder.layers.43.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.36.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.14.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.47.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.46.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.weight lr_decay_rate 0.2287679245496101 name module.module.external_feature_model.vit.decoder.layers.18.ls2 lr_decay_rate 0.531441name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.bias lr_decay_rate 0.9 name module.module.external_feature_model.vit.decoder.layers.20.ls1 lr_decay_rate 0.6561 _get_param_groups name module.module.decoder.layers.12.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.14.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.43.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.46.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.47.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.weight key (1.0, 0.02287679245496101, False, False)_get_param_groups name module.module.decoder.layers.36.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.ls2 key (0.0, 0.05314410000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.bias key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.ls1 key (0.0, 0.06561, False, False) _get_param_groups name module.module.decoder.layers.12.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.15.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.bias lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.decoder.final_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.36.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.12.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.weight lr_decay_rate 0.531441 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.self_attention.linear_qkv.bias key (0.0, 0.02287679245496101, False, False)name module.module.external_feature_model.vit.decoder.layers.20.ls2 lr_decay_rate 0.6561 _get_param_groups name module.module.decoder.layers.47.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.weight lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.15.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.output_layer.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.36.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.12.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.ls2 key (0.0, 0.06561, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.weight key (0.0, 0.05314410000000001, False, False) _get_param_groups name module.module.decoder.layers.43.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.weight key (1.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.47.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.15.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.weight lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.decoder.layers.37.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.bias lr_decay_rate 0.531441_get_param_groups name module.module.decoder.layers.43.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.weight lr_decay_rate 0.6561_get_param_groups name module.module.decoder.layers.12.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.bias lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.15.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.weight key (0.0, 0.02287679245496101, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.bias key (0.0, 0.05314410000000001, False, False)_get_param_groups name module.module.decoder.layers.37.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.weight key (0.0, 0.06561, False, False)_get_param_groups name module.module.decoder.layers.43.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.bias key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.12.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.bias lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.decoder.layers.15.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.bias lr_decay_rate 0.6561 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.pre_mlp_layernorm.bias key (0.0, 0.02287679245496101, False, False)_get_param_groups name module.module.decoder.layers.12.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.44.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.weight lr_decay_rate 0.531441name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.weight lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.37.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.15.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.bias key (0.0, 0.06561, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.weight key (1.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.weight lr_decay_rate 0.2287679245496101_get_param_groups name module.module.decoder.layers.13.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.weight key (1.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.15.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.47.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.weight key (1.0, 0.02287679245496101, False, False)name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.weight lr_decay_rate 0.6561name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.bias lr_decay_rate 0.531441name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.bias lr_decay_rate 0.9_get_param_groups name module.module.decoder.layers.13.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.44.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.16.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.bias key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.bias key (0.0, 0.05314410000000001, False, False) _get_param_groups name module.module.decoder.layers.44.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.37.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.13.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.bias lr_decay_rate 0.2287679245496101_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.weight key (1.0, 0.06561, False, False) _get_param_groups name module.module.decoder.layers.16.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.final_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.weight lr_decay_rate 0.9 name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.weight lr_decay_rate 0.531441 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc1.bias key (0.0, 0.02287679245496101, False, False)_get_param_groups name module.module.decoder.layers.13.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.bias lr_decay_rate 0.6561 _get_param_groups name module.module.decoder.layers.44.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.output_layer.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.16.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.weight key (0.0, 0.09000000000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.weight key (1.0, 0.05314410000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.bias key (0.0, 0.06561, False, False)name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.weight lr_decay_rate 0.2287679245496101 _get_param_groups name module.module.decoder.layers.16.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.13.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.38.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.44.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.bias lr_decay_rate 0.9 name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.bias lr_decay_rate 0.531441 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.weight key (1.0, 0.02287679245496101, False, False)name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.weight lr_decay_rate 0.6561 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.bias key (0.0, 0.05314410000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.bias key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.13.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.weight key (1.0, 0.06561, False, False) _get_param_groups name module.module.decoder.layers.16.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.44.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.38.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.bias lr_decay_rate 0.2287679245496101 name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.bias lr_decay_rate 0.6561_get_param_groups name module.module.decoder.layers.13.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.weight lr_decay_rate 0.9name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.weight lr_decay_rate 0.531441_get_param_groups name module.module.external_feature_model.vit.decoder.layers.10.mlp.linear_fc2.bias key (0.0, 0.02287679245496101, False, False)_get_param_groups name module.module.decoder.layers.16.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.38.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.45.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.bias key (0.0, 0.06561, False, False)_get_param_groups name module.module.decoder.layers.14.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.16.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.38.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.weight key (1.0, 0.09000000000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.11.ls1 lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.weight key (0.0, 0.05314410000000001, False, False)_get_param_groups name module.module.decoder.layers.45.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.17.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.14.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.bias lr_decay_rate 0.9name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.weight lr_decay_rate 0.6561 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.ls1 key (0.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.bias lr_decay_rate 0.531441_get_param_groups name module.module.decoder.layers.45.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.38.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.14.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.17.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.weight key (0.0, 0.06561, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.bias key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.bias key (0.0, 0.05314410000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.11.ls2 lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.decoder.layers.45.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.14.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.38.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.bias lr_decay_rate 0.6561_get_param_groups name module.module.decoder.layers.17.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.weight lr_decay_rate 0.9 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.ls2 key (0.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.weight lr_decay_rate 0.531441 _get_param_groups name module.module.decoder.layers.45.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.bias key (0.0, 0.06561, False, False)_get_param_groups name module.module.decoder.layers.14.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.17.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.38.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.weight key (1.0, 0.09000000000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.weight key (1.0, 0.05314410000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.weight lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.decoder.layers.45.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.14.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.weight lr_decay_rate 0.6561 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.weight key (0.0, 0.02541865828329001, False, False)name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.bias lr_decay_rate 0.9name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.bias lr_decay_rate 0.531441_get_param_groups name module.module.decoder.layers.39.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.45.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.17.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.14.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.weight key (1.0, 0.06561, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.bias key (0.0, 0.09000000000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.bias lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.bias key (0.0, 0.05314410000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.bias lr_decay_rate 0.6561 _get_param_groups name module.module.decoder.layers.46.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.39.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.17.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.15.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.bias key (0.0, 0.06561, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.input_layernorm.bias key (0.0, 0.02541865828329001, False, False) name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.weight lr_decay_rate 0.531441_get_param_groups name module.module.decoder.layers.17.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vision_projection.encoder.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.39.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.46.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.15.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.weight lr_decay_rate 0.6561 name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.weight lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.weight key (1.0, 0.05314410000000001, False, False) _get_param_groups name module.module.decoder.layers.15.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.39.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.46.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.weight key (1.0, 0.06561, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.weight key (1.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.vision_projection.encoder.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.18.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.bias lr_decay_rate 0.531441_get_param_groups name module.module.decoder.layers.15.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.46.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.bias lr_decay_rate 0.6561name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.bias lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.external_feature_model.pre_proj_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.39.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.18.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.bias key (0.0, 0.05314410000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.bias key (0.0, 0.06561, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_proj.bias key (0.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.pre_proj_layernorm.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.15.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.46.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.18.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.39.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.19.ls1 lr_decay_rate 0.5904900000000001 name module.module.external_feature_model.vit.decoder.layers.21.ls1 lr_decay_rate 0.7290000000000001 name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.weight lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.decoder.layers.46.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.15.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.18.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.39.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.embedding.word_embeddings.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.ls1 key (0.0, 0.0729, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.ls1 key (0.0, 0.05904900000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.weight key (1.0, 0.02541865828329001, False, False) _get_param_groups name module.module.decoder.layers.46.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.15.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.18.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.bias lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.decoder.layers.40.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.21.ls2 lr_decay_rate 0.7290000000000001 name module.module.external_feature_model.vit.decoder.layers.19.ls2 lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.decoder.layers.16.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.0.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.18.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.self_attention.linear_qkv.bias key (0.0, 0.02541865828329001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.ls2 key (0.0, 0.0729, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.ls2 key (0.0, 0.05904900000000001, False, False)_get_param_groups name module.module.decoder.layers.47.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.18.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.16.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.0.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.weight lr_decay_rate 0.7290000000000001name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.weight lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.decoder.layers.40.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.weight lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.decoder.layers.19.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.16.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.47.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.0.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.weight key (0.0, 0.0729, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.weight key (0.0, 0.02541865828329001, False, False) _get_param_groups name module.module.decoder.layers.40.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.weight key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.decoder.layers.16.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.0.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.bias lr_decay_rate 0.7290000000000001_get_param_groups name module.module.decoder.layers.19.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.bias lr_decay_rate 0.2541865828329001 name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.bias lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.decoder.layers.40.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.bias key (0.0, 0.0729, False, False) _get_param_groups name module.module.decoder.layers.16.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.bias key (0.0, 0.05904900000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.pre_mlp_layernorm.bias key (0.0, 0.02541865828329001, False, False)_get_param_groups name module.module.decoder.layers.19.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.0.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.weight lr_decay_rate 0.7290000000000001_get_param_groups name module.module.decoder.layers.19.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.16.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.weight lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.decoder.layers.0.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.weight lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.decoder.layers.47.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.weight key (1.0, 0.0729, False, False) _get_param_groups name module.module.decoder.layers.16.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.weight key (1.0, 0.02541865828329001, False, False) _get_param_groups name module.module.decoder.layers.19.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.0.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.41.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.weight key (1.0, 0.05904900000000001, False, False)_get_param_groups name module.module.decoder.layers.47.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.bias lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.decoder.layers.17.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.bias lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.decoder.layers.19.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.1.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.bias key (0.0, 0.0729, False, False) _get_param_groups name module.module.decoder.final_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.bias lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc1.bias key (0.0, 0.02541865828329001, False, False)_get_param_groups name module.module.decoder.layers.41.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.19.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.17.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.1.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.weight lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.output_layer.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.bias key (0.0, 0.05904900000000001, False, False)_get_param_groups name module.module.decoder.layers.41.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.20.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.weight lr_decay_rate 0.2541865828329001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.weight key (1.0, 0.0729, False, False) _get_param_groups name module.module.decoder.layers.1.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.17.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.41.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.weight lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.weight key (1.0, 0.02541865828329001, False, False) _get_param_groups name module.module.decoder.layers.20.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.1.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.17.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.bias lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.weight key (1.0, 0.05904900000000001, False, False) _get_param_groups name module.module.decoder.layers.41.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.bias lr_decay_rate 0.2541865828329001 _get_param_groups name module.module.decoder.layers.20.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.bias key (0.0, 0.0729, False, False) _get_param_groups name module.module.decoder.layers.1.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.bias lr_decay_rate 0.5904900000000001_get_param_groups name module.module.decoder.layers.17.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.11.mlp.linear_fc2.bias key (0.0, 0.02541865828329001, False, False)_get_param_groups name module.module.decoder.layers.41.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.20.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.bias key (0.0, 0.05904900000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.weight lr_decay_rate 0.7290000000000001_get_param_groups name module.module.decoder.layers.1.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.17.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.41.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.12.ls1 lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.decoder.layers.20.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.weight key (0.0, 0.0729, False, False)_get_param_groups name module.module.decoder.layers.1.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.17.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.weight lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.ls1 key (0.0, 0.028242953648100012, False, False)_get_param_groups name module.module.decoder.layers.20.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.bias lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.decoder.layers.2.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.18.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.weight key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.decoder.layers.20.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.12.ls2 lr_decay_rate 0.2824295364810001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.bias key (0.0, 0.0729, False, False) _get_param_groups name module.module.decoder.layers.42.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.2.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.18.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.bias lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.ls2 key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.decoder.layers.21.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.weight lr_decay_rate 0.7290000000000001_get_param_groups name module.module.decoder.layers.42.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.2.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.bias key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.decoder.layers.18.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.weight lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.weight key (1.0, 0.0729, False, False)_get_param_groups name module.module.decoder.layers.21.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.2.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.18.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.weight key (0.0, 0.028242953648100012, False, False)name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.weight lr_decay_rate 0.5904900000000001 name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.bias lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.decoder.layers.21.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.2.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.weight key (1.0, 0.05904900000000001, False, False)_get_param_groups name module.module.decoder.layers.42.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.18.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.bias lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.bias key (0.0, 0.0729, False, False) _get_param_groups name module.module.decoder.layers.21.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.2.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.bias lr_decay_rate 0.5904900000000001_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.input_layernorm.bias key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.decoder.layers.18.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.2.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.weight lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.decoder.layers.21.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.bias key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.decoder.layers.18.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.weight lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.decoder.layers.3.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.weight key (1.0, 0.0729, False, False) _get_param_groups name module.module.decoder.layers.42.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.21.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.weight lr_decay_rate 0.5904900000000001_get_param_groups name module.module.decoder.layers.19.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.weight key (1.0, 0.028242953648100012, False, False) name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.bias lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.decoder.layers.3.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.43.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.weight key (1.0, 0.05904900000000001, False, False) _get_param_groups name module.module.decoder.layers.21.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.bias key (0.0, 0.0729, False, False) _get_param_groups name module.module.decoder.layers.19.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.bias lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.decoder.layers.3.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.bias lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.decoder.layers.43.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.22.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_proj.bias key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.decoder.layers.19.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.3.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.ls1 lr_decay_rate 0.81 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.bias key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.decoder.layers.43.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.19.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.weight lr_decay_rate 0.2824295364810001_get_param_groups name module.module.decoder.layers.22.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.ls1 key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.3.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.20.ls1 lr_decay_rate 0.6561 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.weight key (1.0, 0.028242953648100012, False, False) _get_param_groups name module.module.decoder.layers.22.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.19.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.ls2 lr_decay_rate 0.81 _get_param_groups name module.module.decoder.layers.3.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.ls1 key (0.0, 0.06561, False, False) _get_param_groups name module.module.decoder.layers.43.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.bias lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.decoder.layers.22.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.ls2 key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.19.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.3.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.20.ls2 lr_decay_rate 0.6561 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.self_attention.linear_qkv.bias key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.decoder.layers.43.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.19.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.weight lr_decay_rate 0.81 _get_param_groups name module.module.decoder.layers.22.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.ls2 key (0.0, 0.06561, False, False)_get_param_groups name module.module.decoder.layers.4.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.weight key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.20.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.weight lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.decoder.layers.22.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.weight lr_decay_rate 0.6561 _get_param_groups name module.module.decoder.layers.4.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.bias lr_decay_rate 0.81_get_param_groups name module.module.decoder.layers.44.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.weight key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.decoder.layers.20.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.22.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.weight key (0.0, 0.06561, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.bias key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.4.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.bias lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.decoder.layers.20.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.23.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.bias lr_decay_rate 0.6561 _get_param_groups name module.module.decoder.layers.44.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.pre_mlp_layernorm.bias key (0.0, 0.028242953648100012, False, False)_get_param_groups name module.module.decoder.layers.4.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.weight lr_decay_rate 0.81_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.bias key (0.0, 0.06561, False, False) _get_param_groups name module.module.decoder.layers.20.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.23.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.weight lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.decoder.layers.4.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.weight key (1.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.44.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.23.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.weight key (1.0, 0.028242953648100012, False, False)_get_param_groups name module.module.decoder.layers.20.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.weight lr_decay_rate 0.6561_get_param_groups name module.module.decoder.layers.4.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.bias lr_decay_rate 0.81 _get_param_groups name module.module.decoder.layers.23.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.bias lr_decay_rate 0.2824295364810001_get_param_groups name module.module.decoder.layers.20.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.weight key (1.0, 0.06561, False, False) _get_param_groups name module.module.decoder.layers.4.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.bias key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc1.bias key (0.0, 0.028242953648100012, False, False)_get_param_groups name module.module.decoder.layers.23.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.20.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.bias lr_decay_rate 0.6561 _get_param_groups name module.module.decoder.layers.5.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.weight lr_decay_rate 0.81 _get_param_groups name module.module.decoder.layers.23.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.weight lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.decoder.layers.44.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.bias key (0.0, 0.06561, False, False)_get_param_groups name module.module.decoder.layers.21.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.weight key (1.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.5.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.23.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.weight key (1.0, 0.028242953648100012, False, False) name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.bias lr_decay_rate 0.81_get_param_groups name module.module.decoder.layers.45.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.5.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.weight lr_decay_rate 0.6561_get_param_groups name module.module.decoder.layers.21.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.bias lr_decay_rate 0.2824295364810001 _get_param_groups name module.module.decoder.layers.24.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.bias key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.12.mlp.linear_fc2.bias key (0.0, 0.028242953648100012, False, False) _get_param_groups name module.module.decoder.layers.5.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.weight key (1.0, 0.06561, False, False) _get_param_groups name module.module.decoder.layers.21.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.24.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.45.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.13.ls1 lr_decay_rate 0.31381059609000006name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.bias lr_decay_rate 0.6561name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.weight lr_decay_rate 0.81_get_param_groups name module.module.decoder.layers.5.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.21.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.24.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.45.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.bias key (0.0, 0.06561, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.weight key (0.0, 0.08100000000000002, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.ls1 key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.decoder.layers.24.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.5.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.45.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.21.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.bias lr_decay_rate 0.81 name module.module.external_feature_model.vit.decoder.layers.13.ls2 lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.decoder.layers.5.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.weight lr_decay_rate 0.6561 _get_param_groups name module.module.decoder.layers.24.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.45.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.bias key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.21.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.ls2 key (0.0, 0.031381059609000006, False, False)_get_param_groups name module.module.decoder.layers.6.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.weight key (0.0, 0.06561, False, False) _get_param_groups name module.module.decoder.layers.45.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.24.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.21.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.weight lr_decay_rate 0.81 name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.bias lr_decay_rate 0.6561 name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.weight lr_decay_rate 0.31381059609000006_get_param_groups name module.module.decoder.layers.6.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.45.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.weight key (1.0, 0.08100000000000002, False, False)_get_param_groups name module.module.decoder.layers.24.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.bias key (0.0, 0.06561, False, False)_get_param_groups name module.module.decoder.layers.22.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.weight key (0.0, 0.031381059609000006, False, False)_get_param_groups name module.module.decoder.layers.6.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.46.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.bias lr_decay_rate 0.81 _get_param_groups name module.module.decoder.layers.25.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.6.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.weight lr_decay_rate 0.6561name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.bias lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.decoder.layers.22.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.bias key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.46.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.input_layernorm.bias key (0.0, 0.031381059609000006, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.weight key (1.0, 0.06561, False, False) _get_param_groups name module.module.decoder.layers.6.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.25.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.22.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.weight lr_decay_rate 0.81 _get_param_groups name module.module.decoder.layers.46.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.bias lr_decay_rate 0.6561_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.weight key (1.0, 0.08100000000000002, False, False)_get_param_groups name module.module.decoder.layers.25.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.22.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.6.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.46.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.weight lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.bias key (0.0, 0.06561, False, False) name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.bias lr_decay_rate 0.81_get_param_groups name module.module.decoder.layers.25.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.6.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.weight key (1.0, 0.031381059609000006, False, False) _get_param_groups name module.module.decoder.layers.22.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.bias key (0.0, 0.08100000000000002, False, False)_get_param_groups name module.module.decoder.layers.46.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.weight lr_decay_rate 0.6561 _get_param_groups name module.module.decoder.layers.7.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.25.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.bias lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.decoder.layers.22.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.weight key (1.0, 0.06561, False, False) _get_param_groups name module.module.decoder.layers.46.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.ls1 lr_decay_rate 0.9_get_param_groups name module.module.decoder.layers.25.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_proj.bias key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.decoder.layers.7.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.22.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.bias lr_decay_rate 0.6561 _get_param_groups name module.module.decoder.layers.46.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.ls1 key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.25.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.7.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.bias key (0.0, 0.06561, False, False)name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.weight lr_decay_rate 0.31381059609000006_get_param_groups name module.module.decoder.layers.23.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.ls2 lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.26.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.weight key (1.0, 0.031381059609000006, False, False) _get_param_groups name module.module.decoder.layers.7.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.ls2 key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.23.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.21.ls1 lr_decay_rate 0.7290000000000001 name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.bias lr_decay_rate 0.31381059609000006_get_param_groups name module.module.decoder.layers.26.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.7.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.weight lr_decay_rate 0.9_get_param_groups name module.module.decoder.layers.23.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.47.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.ls1 key (0.0, 0.0729, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.self_attention.linear_qkv.bias key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.decoder.layers.26.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.7.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.weight key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.23.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.26.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.7.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.21.ls2 lr_decay_rate 0.7290000000000001 name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.weight lr_decay_rate 0.31381059609000006 name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.bias lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.23.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.47.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.ls2 key (0.0, 0.0729, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.weight key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.bias key (0.0, 0.09000000000000001, False, False)_get_param_groups name module.module.decoder.layers.8.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.26.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.23.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.bias lr_decay_rate 0.31381059609000006name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.weight lr_decay_rate 0.7290000000000001_get_param_groups name module.module.decoder.layers.47.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.26.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.weight lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.8.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.weight key (0.0, 0.0729, False, False) _get_param_groups name module.module.decoder.layers.26.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.23.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.pre_mlp_layernorm.bias key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.weight key (1.0, 0.09000000000000001, False, False)_get_param_groups name module.module.decoder.layers.8.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.bias lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.decoder.layers.27.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.8.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.24.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.weight lr_decay_rate 0.31381059609000006 name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.bias lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.47.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.bias key (0.0, 0.0729, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.bias key (0.0, 0.09000000000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.weight key (1.0, 0.031381059609000006, False, False) _get_param_groups name module.module.decoder.layers.27.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.24.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.final_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.8.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.weight lr_decay_rate 0.7290000000000001 name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.bias lr_decay_rate 0.31381059609000006 name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.weight lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.27.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.24.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.8.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.output_layer.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.weight key (1.0, 0.0729, False, False) _get_param_groups name module.module.decoder.layers.27.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc1.bias key (0.0, 0.031381059609000006, False, False) _get_param_groups name module.module.decoder.layers.8.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.weight key (1.0, 0.09000000000000001, False, False)name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.bias lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.decoder.layers.24.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.weight lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.decoder.layers.27.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.bias key (0.0, 0.0729, False, False) name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.bias lr_decay_rate 0.9_get_param_groups name module.module.decoder.layers.9.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.weight key (1.0, 0.031381059609000006, False, False) _get_param_groups name module.module.decoder.layers.24.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.27.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.bias key (0.0, 0.09000000000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.weight lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.decoder.layers.9.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.bias lr_decay_rate 0.31381059609000006 _get_param_groups name module.module.decoder.layers.24.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.27.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.weight key (1.0, 0.0729, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.13.mlp.linear_fc2.bias key (0.0, 0.031381059609000006, False, False) name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.weight lr_decay_rate 0.9_get_param_groups name module.module.decoder.layers.9.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.24.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.28.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.bias lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.decoder.layers.9.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.weight key (0.0, 0.09000000000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.14.ls1 lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.decoder.layers.25.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.bias key (0.0, 0.0729, False, False) _get_param_groups name module.module.decoder.layers.28.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.bias lr_decay_rate 0.9 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.ls1 key (0.0, 0.03486784401000001, False, False) _get_param_groups name module.module.decoder.layers.9.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.25.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.28.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.bias key (0.0, 0.09000000000000001, False, False) name module.module.external_feature_model.vit.decoder.layers.14.ls2 lr_decay_rate 0.3486784401000001_get_param_groups name module.module.decoder.layers.9.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.weight lr_decay_rate 0.7290000000000001_get_param_groups name module.module.decoder.layers.28.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.25.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.weight lr_decay_rate 0.9 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.ls2 key (0.0, 0.03486784401000001, False, False)_get_param_groups name module.module.decoder.layers.9.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.weight key (0.0, 0.0729, False, False)_get_param_groups name module.module.decoder.layers.25.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.weight key (1.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.28.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.10.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.weight lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.bias lr_decay_rate 0.7290000000000001 name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.bias lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.28.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.25.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.weight key (0.0, 0.03486784401000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.bias key (0.0, 0.0729, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.bias key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.10.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.28.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.25.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.bias lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.weight lr_decay_rate 0.9_get_param_groups name module.module.decoder.layers.10.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.29.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.weight lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.decoder.layers.25.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.input_layernorm.bias key (0.0, 0.03486784401000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.weight key (1.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.10.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.weight key (1.0, 0.0729, False, False) _get_param_groups name module.module.decoder.layers.29.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.26.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.bias lr_decay_rate 0.9 name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.weight lr_decay_rate 0.3486784401000001 name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.bias lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.decoder.layers.10.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.bias key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.26.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.weight key (1.0, 0.03486784401000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.bias key (0.0, 0.0729, False, False) _get_param_groups name module.module.decoder.layers.10.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.29.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.26.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vision_projection.encoder.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.bias lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.decoder.layers.10.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.weight lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.decoder.layers.29.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.26.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_proj.bias key (0.0, 0.03486784401000001, False, False) _get_param_groups name module.module.external_feature_model.vision_projection.encoder.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.weight key (1.0, 0.0729, False, False) _get_param_groups name module.module.decoder.layers.11.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.weight lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.decoder.layers.26.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.bias lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.external_feature_model.pre_proj_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.11.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.weight key (1.0, 0.03486784401000001, False, False) _get_param_groups name module.module.decoder.layers.26.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.bias key (0.0, 0.0729, False, False) _get_param_groups name module.module.external_feature_model.pre_proj_layernorm.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.30.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.11.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.bias lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.decoder.layers.26.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.ls1 lr_decay_rate 0.81 _get_param_groups name module.module.decoder.layers.11.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.self_attention.linear_qkv.bias key (0.0, 0.03486784401000001, False, False) _get_param_groups name module.module.embedding.word_embeddings.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.30.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.27.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.ls1 key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.11.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.30.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.weight lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.decoder.layers.0.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.22.ls2 lr_decay_rate 0.81 _get_param_groups name module.module.decoder.layers.27.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.30.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.11.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.weight key (0.0, 0.03486784401000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.ls2 key (0.0, 0.08100000000000002, False, False)_get_param_groups name module.module.decoder.layers.11.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.27.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.0.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.bias lr_decay_rate 0.3486784401000001_get_param_groups name module.module.decoder.layers.30.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.27.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.pre_mlp_layernorm.bias key (0.0, 0.03486784401000001, False, False)name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.weight lr_decay_rate 0.81_get_param_groups name module.module.decoder.layers.0.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.12.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.30.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.27.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.weight key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.0.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.weight lr_decay_rate 0.3486784401000001_get_param_groups name module.module.decoder.layers.12.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.30.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.27.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.bias lr_decay_rate 0.81 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.weight key (1.0, 0.03486784401000001, False, False) _get_param_groups name module.module.decoder.layers.12.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.31.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.0.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.bias key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.27.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.12.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.bias lr_decay_rate 0.3486784401000001 _get_param_groups name module.module.decoder.layers.0.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc1.bias key (0.0, 0.03486784401000001, False, False)_get_param_groups name module.module.decoder.layers.31.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.28.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.weight lr_decay_rate 0.81 _get_param_groups name module.module.decoder.layers.12.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.0.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.31.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.weight key (1.0, 0.08100000000000002, False, False) name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.weight lr_decay_rate 0.3486784401000001_get_param_groups name module.module.decoder.layers.12.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.28.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.31.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.1.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.bias lr_decay_rate 0.81_get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.weight key (1.0, 0.03486784401000001, False, False)_get_param_groups name module.module.decoder.layers.12.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.28.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.bias key (0.0, 0.08100000000000002, False, False)_get_param_groups name module.module.decoder.layers.31.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.13.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.bias lr_decay_rate 0.3486784401000001_get_param_groups name module.module.decoder.layers.1.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.28.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.14.mlp.linear_fc2.bias key (0.0, 0.03486784401000001, False, False)name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.weight lr_decay_rate 0.81_get_param_groups name module.module.decoder.layers.31.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.1.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.28.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.13.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.31.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.weight key (1.0, 0.08100000000000002, False, False)_get_param_groups name module.module.decoder.layers.1.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.13.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.28.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.15.ls1 lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.decoder.layers.32.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.28.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.bias lr_decay_rate 0.81 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.ls1 key (0.0, 0.03874204890000001, False, False)_get_param_groups name module.module.decoder.layers.13.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.1.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.bias key (0.0, 0.08100000000000002, False, False)_get_param_groups name module.module.decoder.layers.29.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.15.ls2 lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.decoder.layers.1.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.32.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.13.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.ls2 key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.decoder.layers.1.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.32.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.weight lr_decay_rate 0.81 _get_param_groups name module.module.decoder.layers.13.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.weight lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.decoder.layers.2.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.32.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.weight key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.13.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.weight key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.decoder.layers.2.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.32.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.bias lr_decay_rate 0.81name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.bias lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.decoder.layers.14.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.2.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.bias key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.input_layernorm.bias key (0.0, 0.03874204890000001, False, False)_get_param_groups name module.module.decoder.layers.32.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.2.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.14.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.weight lr_decay_rate 0.81_get_param_groups name module.module.decoder.layers.32.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.weight lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.decoder.layers.14.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.2.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.29.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.33.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.weight key (1.0, 0.08100000000000002, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.weight key (1.0, 0.03874204890000001, False, False) _get_param_groups name module.module.decoder.layers.30.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.2.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.14.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.bias lr_decay_rate 0.81 _get_param_groups name module.module.decoder.layers.2.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.bias lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.decoder.layers.33.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.30.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.14.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.bias key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_proj.bias key (0.0, 0.03874204890000001, False, False)_get_param_groups name module.module.decoder.layers.3.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.33.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.30.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.14.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.weight lr_decay_rate 0.81 _get_param_groups name module.module.decoder.layers.33.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.weight lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.decoder.layers.3.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.30.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.14.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.weight key (1.0, 0.08100000000000002, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.weight key (1.0, 0.03874204890000001, False, False) _get_param_groups name module.module.decoder.layers.3.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.33.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.30.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.15.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.bias lr_decay_rate 0.81 name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.bias lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.decoder.layers.3.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.33.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.bias key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.30.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.self_attention.linear_qkv.bias key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.decoder.layers.15.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.33.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.3.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.30.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.23.ls1 lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.15.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.weight lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.decoder.layers.3.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.34.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.ls1 key (0.0, 0.09000000000000001, False, False)_get_param_groups name module.module.decoder.layers.31.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.15.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.weight key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.decoder.layers.3.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.34.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.ls2 lr_decay_rate 0.9name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.bias lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.decoder.layers.4.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.31.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.15.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.34.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.ls2 key (0.0, 0.09000000000000001, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.pre_mlp_layernorm.bias key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.decoder.layers.15.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.31.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.34.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.4.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.weight lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.31.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.weight lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.decoder.layers.15.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.4.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.34.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.weight key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.4.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.weight key (1.0, 0.03874204890000001, False, False) _get_param_groups name module.module.decoder.layers.31.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.16.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.34.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.bias lr_decay_rate 0.9 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.bias key (0.0, 0.09000000000000001, False, False)_get_param_groups name module.module.decoder.layers.34.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.bias lr_decay_rate 0.3874204890000001_get_param_groups name module.module.decoder.layers.31.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.4.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.16.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc1.bias key (0.0, 0.03874204890000001, False, False)_get_param_groups name module.module.decoder.layers.35.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.16.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.31.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.4.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.weight lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.16.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.weight lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.decoder.layers.4.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.35.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.32.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.weight key (1.0, 0.09000000000000001, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.weight key (1.0, 0.03874204890000001, False, False) _get_param_groups name module.module.decoder.layers.5.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.16.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.35.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.bias lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.32.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.bias lr_decay_rate 0.3874204890000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.bias key (0.0, 0.09000000000000001, False, False)_get_param_groups name module.module.decoder.layers.35.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.16.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.5.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.32.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.15.mlp.linear_fc2.bias key (0.0, 0.03874204890000001, False, False) _get_param_groups name module.module.decoder.layers.32.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.16.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.weight lr_decay_rate 0.9_get_param_groups name module.module.decoder.layers.5.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.35.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.16.ls1 lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.weight key (1.0, 0.09000000000000001, False, False)_get_param_groups name module.module.decoder.layers.5.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.32.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.ls1 key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.decoder.layers.17.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.35.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.35.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.16.ls2 lr_decay_rate 0.4304672100000001name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.bias lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.32.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.17.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.5.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.ls2 key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.decoder.layers.36.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.bias key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.17.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.32.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.5.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.17.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.5.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.weight lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.decoder.layers.36.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.33.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.weight lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.6.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.weight key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.decoder.layers.36.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.17.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.weight key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.33.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.36.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.bias lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.17.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.33.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.bias lr_decay_rate 0.4304672100000001_get_param_groups name module.module.decoder.layers.6.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.bias key (0.0, 0.09000000000000001, False, False)_get_param_groups name module.module.decoder.layers.33.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.input_layernorm.bias key (0.0, 0.04304672100000001, False, False)_get_param_groups name module.module.decoder.layers.36.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.17.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.6.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.6.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.weight lr_decay_rate 0.9_get_param_groups name module.module.decoder.layers.36.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.33.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.18.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.weight lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.decoder.layers.36.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.6.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.weight key (1.0, 0.09000000000000001, False, False)_get_param_groups name module.module.decoder.layers.33.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.weight key (1.0, 0.04304672100000001, False, False)_get_param_groups name module.module.decoder.layers.18.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.bias lr_decay_rate 0.9_get_param_groups name module.module.decoder.layers.6.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.33.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.37.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.18.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.bias lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.bias key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.6.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.18.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.34.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_proj.bias key (0.0, 0.04304672100000001, False, False) _get_param_groups name module.module.decoder.layers.37.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.weight lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.7.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.weight lr_decay_rate 0.4304672100000001_get_param_groups name module.module.decoder.layers.34.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.18.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.weight key (1.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.37.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.7.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.weight key (1.0, 0.04304672100000001, False, False)_get_param_groups name module.module.decoder.layers.34.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.18.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.bias lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.7.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.34.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.bias lr_decay_rate 0.4304672100000001_get_param_groups name module.module.decoder.layers.37.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.bias key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.18.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.7.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.self_attention.linear_qkv.bias key (0.0, 0.04304672100000001, False, False) _get_param_groups name module.module.decoder.layers.37.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.34.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.19.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vision_projection.encoder.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.7.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.34.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.weight lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.decoder.layers.19.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.7.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vision_projection.encoder.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.34.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.38.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.weight key (0.0, 0.04304672100000001, False, False) _get_param_groups name module.module.decoder.layers.19.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.7.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.35.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.bias lr_decay_rate 0.4304672100000001_get_param_groups name module.module.external_feature_model.pre_proj_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.19.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.38.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.8.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.pre_mlp_layernorm.bias key (0.0, 0.04304672100000001, False, False) _get_param_groups name module.module.decoder.layers.38.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.pre_proj_layernorm.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.35.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.8.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.19.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.38.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.weight lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.decoder.layers.35.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.embedding.word_embeddings.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.8.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.19.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.weight key (1.0, 0.04304672100000001, False, False) _get_param_groups name module.module.decoder.layers.35.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.38.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.8.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.19.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.bias lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.decoder.layers.38.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.0.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.35.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc1.bias key (0.0, 0.04304672100000001, False, False) _get_param_groups name module.module.decoder.layers.20.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.38.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.8.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.35.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.0.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.weight lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.decoder.layers.39.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.20.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.8.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.35.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.weight key (1.0, 0.04304672100000001, False, False) _get_param_groups name module.module.decoder.layers.8.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.20.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.0.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.36.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.39.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.bias lr_decay_rate 0.4304672100000001 _get_param_groups name module.module.decoder.layers.20.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.9.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.39.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.0.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.16.mlp.linear_fc2.bias key (0.0, 0.04304672100000001, False, False) _get_param_groups name module.module.decoder.layers.36.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.39.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.20.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.9.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.36.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.0.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.17.ls1 lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.decoder.layers.9.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.20.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.39.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.36.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.ls1 key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.decoder.layers.0.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.9.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.20.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.39.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.17.ls2 lr_decay_rate 0.4782969000000001_get_param_groups name module.module.decoder.layers.0.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.36.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.21.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.9.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.39.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.ls2 key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.decoder.layers.1.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.36.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.21.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.9.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.40.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.weight lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.decoder.layers.36.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.9.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.21.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.1.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.weight key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.decoder.layers.37.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.21.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.10.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.1.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.40.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.bias lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.decoder.layers.40.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.1.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.input_layernorm.bias key (0.0, 0.04782969000000001, False, False)_get_param_groups name module.module.decoder.layers.37.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.10.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.21.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.10.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.21.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.1.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.weight lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.decoder.layers.37.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.10.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.21.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.weight key (1.0, 0.04782969000000001, False, False) _get_param_groups name module.module.decoder.layers.1.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.40.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.10.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.22.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.bias lr_decay_rate 0.4782969000000001_get_param_groups name module.module.decoder.layers.1.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.41.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.10.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.22.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_proj.bias key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.decoder.layers.2.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.10.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.41.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.22.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.weight lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.decoder.layers.38.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.11.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.2.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.22.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.41.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.weight key (1.0, 0.04782969000000001, False, False) _get_param_groups name module.module.decoder.layers.2.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.11.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.38.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.41.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.22.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.bias lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.decoder.layers.2.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.11.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.38.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.self_attention.linear_qkv.bias key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.decoder.layers.22.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.41.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.11.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.38.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.2.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.22.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.41.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.weight lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.decoder.layers.2.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.11.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.41.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.23.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.38.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.weight key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.decoder.layers.2.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.11.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.38.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.23.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.bias lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.decoder.layers.11.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.3.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.pre_mlp_layernorm.bias key (0.0, 0.04782969000000001, False, False)_get_param_groups name module.module.decoder.layers.23.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.38.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.12.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.23.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.weight lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.decoder.layers.42.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.39.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.3.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.12.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.weight key (1.0, 0.04782969000000001, False, False)_get_param_groups name module.module.decoder.layers.42.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.23.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.3.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.39.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.12.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.bias lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.decoder.layers.23.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.3.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.39.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.12.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc1.bias key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.decoder.layers.23.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.39.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.weight lr_decay_rate 0.4782969000000001_get_param_groups name module.module.decoder.layers.24.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.12.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.3.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.weight key (1.0, 0.04782969000000001, False, False) _get_param_groups name module.module.decoder.layers.39.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.24.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.12.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.3.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.bias lr_decay_rate 0.4782969000000001 _get_param_groups name module.module.decoder.layers.39.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.24.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.12.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.3.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.17.mlp.linear_fc2.bias key (0.0, 0.04782969000000001, False, False) _get_param_groups name module.module.decoder.layers.43.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.39.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.24.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.13.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.4.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.18.ls1 lr_decay_rate 0.531441 _get_param_groups name module.module.decoder.layers.40.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.24.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.13.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.ls1 key (0.0, 0.05314410000000001, False, False) _get_param_groups name module.module.decoder.layers.4.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.24.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.43.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.13.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.18.ls2 lr_decay_rate 0.531441 _get_param_groups name module.module.decoder.layers.4.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.13.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.24.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.ls2 key (0.0, 0.05314410000000001, False, False) _get_param_groups name module.module.decoder.layers.4.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.25.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.43.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.weight lr_decay_rate 0.531441_get_param_groups name module.module.decoder.layers.13.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.4.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.weight key (0.0, 0.05314410000000001, False, False) _get_param_groups name module.module.decoder.layers.44.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.13.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.25.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.4.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.bias lr_decay_rate 0.531441 _get_param_groups name module.module.decoder.layers.25.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.13.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.4.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.input_layernorm.bias key (0.0, 0.05314410000000001, False, False) _get_param_groups name module.module.decoder.layers.25.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.14.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.5.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.41.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.weight lr_decay_rate 0.531441_get_param_groups name module.module.decoder.layers.44.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.25.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.14.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.5.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.41.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.weight key (1.0, 0.05314410000000001, False, False) _get_param_groups name module.module.decoder.layers.25.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.14.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.5.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.41.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.bias lr_decay_rate 0.531441 _get_param_groups name module.module.decoder.layers.25.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.14.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.5.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.41.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_proj.bias key (0.0, 0.05314410000000001, False, False) _get_param_groups name module.module.decoder.layers.26.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.14.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.5.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.weight lr_decay_rate 0.531441 _get_param_groups name module.module.decoder.layers.41.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.26.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.45.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.14.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.weight key (1.0, 0.05314410000000001, False, False) _get_param_groups name module.module.decoder.layers.5.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.41.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.26.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.14.mlp.linear_fc2.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.bias lr_decay_rate 0.531441 _get_param_groups name module.module.decoder.layers.45.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.5.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.41.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.self_attention.linear_qkv.bias key (0.0, 0.05314410000000001, False, False)_get_param_groups name module.module.decoder.layers.26.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.15.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.45.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.6.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.42.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.45.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.15.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.weight lr_decay_rate 0.531441_get_param_groups name module.module.decoder.layers.26.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.6.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.weight key (0.0, 0.05314410000000001, False, False)_get_param_groups name module.module.decoder.layers.15.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.45.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.26.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.6.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.15.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.bias lr_decay_rate 0.531441 _get_param_groups name module.module.decoder.layers.45.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.6.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.26.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.pre_mlp_layernorm.bias key (0.0, 0.05314410000000001, False, False) _get_param_groups name module.module.decoder.layers.45.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.15.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.6.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.27.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.weight lr_decay_rate 0.531441_get_param_groups name module.module.decoder.layers.46.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.15.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.weight key (1.0, 0.05314410000000001, False, False)_get_param_groups name module.module.decoder.layers.6.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.15.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.46.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.27.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.bias lr_decay_rate 0.531441_get_param_groups name module.module.decoder.layers.6.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.27.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.46.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.16.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc1.bias key (0.0, 0.05314410000000001, False, False) _get_param_groups name module.module.decoder.layers.27.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.7.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.46.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.16.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.weight lr_decay_rate 0.531441 _get_param_groups name module.module.decoder.layers.27.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.7.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.46.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.16.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.weight key (1.0, 0.05314410000000001, False, False)_get_param_groups name module.module.decoder.layers.43.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.27.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.16.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.7.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.46.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.43.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.bias lr_decay_rate 0.531441 _get_param_groups name module.module.decoder.layers.27.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.46.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.16.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.7.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.18.mlp.linear_fc2.bias key (0.0, 0.05314410000000001, False, False) _get_param_groups name module.module.decoder.layers.43.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.28.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.16.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.19.ls1 lr_decay_rate 0.5904900000000001_get_param_groups name module.module.decoder.layers.7.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.28.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.16.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.ls1 key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.decoder.layers.28.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.7.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.17.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.19.ls2 lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.decoder.layers.28.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.7.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.17.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.ls2 key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.decoder.layers.44.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.28.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.47.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.8.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.17.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.weight lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.decoder.layers.44.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.28.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.17.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.weight key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.decoder.layers.47.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.8.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.28.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.bias lr_decay_rate 0.5904900000000001_get_param_groups name module.module.decoder.layers.47.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.8.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.17.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.input_layernorm.bias key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.decoder.layers.8.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.17.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.final_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.17.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.8.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.weight lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.decoder.layers.29.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.44.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.output_layer.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.18.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.weight key (1.0, 0.05904900000000001, False, False)_get_param_groups name module.module.decoder.layers.8.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.45.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.18.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.8.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.bias lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.decoder.layers.29.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.45.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.18.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_proj.bias key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.decoder.layers.9.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.45.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.18.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.weight lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.decoder.layers.45.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.9.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.18.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.weight key (1.0, 0.05904900000000001, False, False) _get_param_groups name module.module.decoder.layers.9.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.30.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.45.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.18.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.bias lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.decoder.layers.9.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.18.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.self_attention.linear_qkv.bias key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.decoder.layers.45.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.30.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.19.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.9.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.45.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.30.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.weight lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.decoder.layers.30.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.9.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.weight key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.decoder.layers.19.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.46.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.9.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.30.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.19.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.bias lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.decoder.layers.46.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.pre_mlp_layernorm.bias key (0.0, 0.05904900000000001, False, False)_get_param_groups name module.module.decoder.layers.19.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.10.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.30.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.46.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.46.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.weight lr_decay_rate 0.5904900000000001_get_param_groups name module.module.decoder.layers.30.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.19.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.10.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.weight key (1.0, 0.05904900000000001, False, False) _get_param_groups name module.module.decoder.layers.31.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.19.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.10.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.46.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.bias lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.decoder.layers.19.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.10.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.31.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.46.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc1.bias key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.decoder.layers.20.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.31.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.46.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.10.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.weight lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.decoder.layers.31.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.20.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.weight key (1.0, 0.05904900000000001, False, False)_get_param_groups name module.module.decoder.layers.10.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.31.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.20.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.bias lr_decay_rate 0.5904900000000001 _get_param_groups name module.module.decoder.layers.10.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.20.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.31.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.19.mlp.linear_fc2.bias key (0.0, 0.05904900000000001, False, False) _get_param_groups name module.module.decoder.layers.11.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.31.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.20.ls1 lr_decay_rate 0.6561_get_param_groups name module.module.decoder.layers.20.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.11.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.32.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.20.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.47.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.11.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.ls1 key (0.0, 0.06561, False, False) _get_param_groups name module.module.decoder.layers.20.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.32.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.11.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.20.ls2 lr_decay_rate 0.6561 _get_param_groups name module.module.decoder.layers.21.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.32.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.ls2 key (0.0, 0.06561, False, False) _get_param_groups name module.module.decoder.layers.11.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.32.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.21.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.weight lr_decay_rate 0.6561_get_param_groups name module.module.decoder.layers.11.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.32.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.21.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.final_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.weight key (0.0, 0.06561, False, False) _get_param_groups name module.module.decoder.layers.11.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.21.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.32.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.output_layer.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.bias lr_decay_rate 0.6561 _get_param_groups name module.module.decoder.layers.12.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.input_layernorm.bias key (0.0, 0.06561, False, False)_get_param_groups name module.module.decoder.layers.32.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.21.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.12.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.33.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.21.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.weight lr_decay_rate 0.6561 _get_param_groups name module.module.decoder.layers.12.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.21.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.weight key (1.0, 0.06561, False, False) _get_param_groups name module.module.decoder.layers.33.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.12.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.22.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.bias lr_decay_rate 0.6561 _get_param_groups name module.module.decoder.layers.33.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.12.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_proj.bias key (0.0, 0.06561, False, False) _get_param_groups name module.module.decoder.layers.33.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.22.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.12.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.weight lr_decay_rate 0.6561_get_param_groups name module.module.decoder.layers.22.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.33.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.12.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.22.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.weight key (1.0, 0.06561, False, False) _get_param_groups name module.module.decoder.layers.33.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.bias lr_decay_rate 0.6561_get_param_groups name module.module.decoder.layers.13.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.33.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.22.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.self_attention.linear_qkv.bias key (0.0, 0.06561, False, False) _get_param_groups name module.module.decoder.layers.22.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.34.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.13.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.22.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.weight lr_decay_rate 0.6561_get_param_groups name module.module.decoder.layers.13.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.34.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.23.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.weight key (0.0, 0.06561, False, False) _get_param_groups name module.module.decoder.layers.13.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.34.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.bias lr_decay_rate 0.6561_get_param_groups name module.module.decoder.layers.23.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.34.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.13.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.pre_mlp_layernorm.bias key (0.0, 0.06561, False, False) _get_param_groups name module.module.decoder.layers.23.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.34.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.13.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.23.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.weight lr_decay_rate 0.6561 _get_param_groups name module.module.decoder.layers.34.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.13.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.weight key (1.0, 0.06561, False, False) _get_param_groups name module.module.decoder.layers.23.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.34.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.bias lr_decay_rate 0.6561_get_param_groups name module.module.decoder.layers.14.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.23.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.35.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc1.bias key (0.0, 0.06561, False, False) _get_param_groups name module.module.decoder.layers.23.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.14.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.35.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.weight lr_decay_rate 0.6561_get_param_groups name module.module.decoder.layers.24.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.14.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.35.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.weight key (1.0, 0.06561, False, False) _get_param_groups name module.module.decoder.layers.14.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.24.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.35.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.bias lr_decay_rate 0.6561 _get_param_groups name module.module.decoder.layers.24.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.14.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.20.mlp.linear_fc2.bias key (0.0, 0.06561, False, False) _get_param_groups name module.module.decoder.layers.35.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.24.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.14.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.21.ls1 lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.decoder.layers.35.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.24.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.14.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.ls1 key (0.0, 0.0729, False, False)_get_param_groups name module.module.decoder.layers.35.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.24.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.15.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.36.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.21.ls2 lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.decoder.layers.24.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.ls2 key (0.0, 0.0729, False, False)_get_param_groups name module.module.decoder.layers.25.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.36.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.15.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.15.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.36.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.weight lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.decoder.layers.25.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.15.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.36.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.weight key (0.0, 0.0729, False, False) _get_param_groups name module.module.decoder.layers.25.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.25.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.bias lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.decoder.layers.36.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.15.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.input_layernorm.bias key (0.0, 0.0729, False, False) _get_param_groups name module.module.decoder.layers.25.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.36.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.15.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.weight lr_decay_rate 0.7290000000000001_get_param_groups name module.module.decoder.layers.25.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.36.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.15.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.weight key (1.0, 0.0729, False, False) _get_param_groups name module.module.decoder.layers.25.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.16.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.bias lr_decay_rate 0.7290000000000001_get_param_groups name module.module.decoder.layers.26.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.16.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_proj.bias key (0.0, 0.0729, False, False) _get_param_groups name module.module.decoder.layers.37.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.26.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.16.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.weight lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.decoder.layers.37.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.26.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.16.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.weight key (1.0, 0.0729, False, False) _get_param_groups name module.module.decoder.layers.26.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.16.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.bias lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.decoder.layers.37.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.26.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.self_attention.linear_qkv.bias key (0.0, 0.0729, False, False) _get_param_groups name module.module.decoder.layers.16.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.26.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.16.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.weight lr_decay_rate 0.7290000000000001_get_param_groups name module.module.decoder.layers.26.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.38.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.17.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.weight key (0.0, 0.0729, False, False)_get_param_groups name module.module.decoder.layers.27.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.38.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.17.self_attention.linear_proj.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.bias lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.decoder.layers.38.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.27.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.pre_mlp_layernorm.bias key (0.0, 0.0729, False, False) _get_param_groups name module.module.decoder.layers.17.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.38.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.27.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.weight lr_decay_rate 0.7290000000000001_get_param_groups name module.module.decoder.layers.17.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.27.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.38.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.weight key (1.0, 0.0729, False, False) _get_param_groups name module.module.decoder.layers.38.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.17.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.27.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.bias lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.decoder.layers.38.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.27.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.17.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc1.bias key (0.0, 0.0729, False, False) _get_param_groups name module.module.decoder.layers.39.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.27.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.17.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.weight lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.decoder.layers.39.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.weight key (1.0, 0.0729, False, False) _get_param_groups name module.module.decoder.layers.28.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.18.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.39.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.bias lr_decay_rate 0.7290000000000001 _get_param_groups name module.module.decoder.layers.28.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.39.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.18.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.21.mlp.linear_fc2.bias key (0.0, 0.0729, False, False) _get_param_groups name module.module.decoder.layers.28.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.39.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.18.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.ls1 lr_decay_rate 0.81 _get_param_groups name module.module.decoder.layers.28.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.39.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.18.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.ls1 key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.28.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.39.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.ls2 lr_decay_rate 0.81 _get_param_groups name module.module.decoder.layers.28.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.18.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.ls2 key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.40.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.28.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.18.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.weight lr_decay_rate 0.81 _get_param_groups name module.module.decoder.layers.40.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.18.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.weight key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.40.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.19.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.29.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.bias lr_decay_rate 0.81 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.input_layernorm.bias key (0.0, 0.08100000000000002, False, False)_get_param_groups name module.module.decoder.layers.29.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.19.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.19.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.weight lr_decay_rate 0.81 _get_param_groups name module.module.decoder.layers.19.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.40.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.weight key (1.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.19.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.29.mlp.linear_fc1.weight key (1.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.bias lr_decay_rate 0.81_get_param_groups name module.module.decoder.layers.41.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_proj.bias key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.29.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.19.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.41.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.weight lr_decay_rate 0.81 _get_param_groups name module.module.decoder.layers.30.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.19.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.41.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.weight key (1.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.41.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.20.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.30.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.bias lr_decay_rate 0.81 _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.self_attention.linear_qkv.bias key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.30.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.41.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.20.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.30.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.weight lr_decay_rate 0.81 _get_param_groups name module.module.decoder.layers.41.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.20.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.30.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.weight key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.20.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.41.mlp.linear_fc2.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.bias lr_decay_rate 0.81_get_param_groups name module.module.decoder.layers.30.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.20.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.pre_mlp_layernorm.bias key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.30.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.20.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.31.input_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.weight lr_decay_rate 0.81 _get_param_groups name module.module.decoder.layers.42.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.20.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.weight key (1.0, 0.08100000000000002, False, False)_get_param_groups name module.module.decoder.layers.31.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.bias lr_decay_rate 0.81 _get_param_groups name module.module.decoder.layers.31.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.21.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc1.bias key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.31.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.21.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.weight lr_decay_rate 0.81 _get_param_groups name module.module.decoder.layers.42.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.31.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.21.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.weight key (1.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.42.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.31.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.21.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.bias lr_decay_rate 0.81 _get_param_groups name module.module.decoder.layers.43.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.31.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.22.mlp.linear_fc2.bias key (0.0, 0.08100000000000002, False, False) _get_param_groups name module.module.decoder.layers.21.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.32.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.ls1 lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.21.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.32.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.43.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.ls1 key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.21.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.32.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.ls2 lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.22.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.32.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.ls2 key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.43.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.22.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.weight lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.43.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.32.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.22.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.weight key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.43.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.22.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.32.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.bias lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.44.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.32.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.22.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.input_layernorm.bias key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.33.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.22.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.weight lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.44.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.22.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.33.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.weight key (1.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.44.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.33.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.23.input_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.bias lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.33.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_proj.bias key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.44.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.23.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.weight lr_decay_rate 0.9_get_param_groups name module.module.decoder.layers.44.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.33.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.23.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.weight key (1.0, 0.09000000000000001, False, False)_get_param_groups name module.module.decoder.layers.44.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.23.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.33.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.bias lr_decay_rate 0.9_get_param_groups name module.module.decoder.layers.45.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.33.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.23.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.self_attention.linear_qkv.bias key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.34.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.45.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.23.mlp.linear_fc1.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.weight lr_decay_rate 0.9_get_param_groups name module.module.decoder.layers.45.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.34.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.23.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.45.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.weight key (0.0, 0.09000000000000001, False, False)_get_param_groups name module.module.decoder.layers.34.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.24.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.34.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.bias lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.45.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.24.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.pre_mlp_layernorm.bias key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.45.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.34.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.24.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.weight lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.45.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.34.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.24.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.weight key (1.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.46.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.34.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.24.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.bias lr_decay_rate 0.9_get_param_groups name module.module.decoder.layers.35.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.46.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc1.bias key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.24.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.46.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.35.self_attention.linear_proj.weight key (1.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.weight lr_decay_rate 0.9_get_param_groups name module.module.decoder.layers.24.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.46.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.35.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.weight key (1.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.35.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.25.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.46.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.bias lr_decay_rate 0.9 _get_param_groups name module.module.decoder.layers.35.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.25.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.46.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vit.decoder.layers.23.mlp.linear_fc2.bias key (0.0, 0.09000000000000001, False, False) _get_param_groups name module.module.decoder.layers.35.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.25.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.46.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.35.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vision_projection.encoder.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.25.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.36.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.vision_projection.encoder.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.25.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.36.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.pre_proj_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.25.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.47.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.36.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.external_feature_model.pre_proj_layernorm.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.25.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.36.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.26.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.embedding.word_embeddings.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.36.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.26.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.36.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.0.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.26.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.36.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.0.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.26.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.final_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.0.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.26.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.37.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.0.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.output_layer.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.26.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.37.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.0.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.26.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.37.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.0.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.27.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.0.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.27.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.1.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.27.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.1.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.27.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.38.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.1.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.1.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.27.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.38.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.38.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.27.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.1.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.38.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.27.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.1.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.28.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.38.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.1.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.38.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.28.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.2.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.38.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.28.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.2.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.28.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.39.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.28.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.2.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.39.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.2.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.39.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.28.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.39.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.28.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.2.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.39.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.29.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.2.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.39.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.2.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.39.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.3.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.29.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.3.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.3.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.29.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.3.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.40.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.29.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.3.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.30.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.3.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.40.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.3.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.30.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.30.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.4.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.30.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.41.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.4.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.41.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.30.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.4.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.41.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.4.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.30.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.41.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.30.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.4.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.31.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.41.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.4.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.41.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.4.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.31.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.41.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.5.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.31.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.31.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.5.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.5.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.31.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.5.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.31.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.31.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.5.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.32.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.5.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.32.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.5.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.32.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.6.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.32.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.6.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.32.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.6.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.32.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.6.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.32.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.6.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.33.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.6.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.33.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.6.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.33.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.7.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.33.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.7.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.7.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.33.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.44.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.7.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.44.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.33.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.33.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.44.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.7.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.34.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.44.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.7.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.7.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.34.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.45.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.34.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.8.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.34.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.45.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.8.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.45.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.8.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.34.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.45.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.8.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.34.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.34.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.8.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.45.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.35.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.45.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.8.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.8.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.45.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.35.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.9.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.46.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.35.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.35.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.9.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.46.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.35.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.46.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.9.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.46.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.9.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.35.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.35.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.46.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.9.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.46.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.36.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.9.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.46.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.9.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.36.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.10.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.36.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.36.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.10.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.10.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.36.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.10.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.36.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.36.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.10.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.37.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.10.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.10.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.11.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.final_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.11.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.output_layer.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.11.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.11.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.11.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.37.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.11.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.38.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.11.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.38.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.12.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.38.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.38.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.12.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.12.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.38.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.12.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.38.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.12.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.38.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.12.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.39.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.12.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.39.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.13.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.39.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.13.self_attention.linear_proj.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.39.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.13.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.39.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.13.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.39.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.39.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.13.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.13.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.13.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.40.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.14.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.14.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.14.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.40.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.14.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.14.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.41.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.14.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.14.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.41.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.15.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.41.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.41.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.15.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.15.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.41.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.15.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.41.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.41.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.15.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.15.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.15.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.42.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.16.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.42.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.16.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.16.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.16.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.16.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.16.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.43.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.16.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.17.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.43.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.17.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.17.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.43.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.17.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.17.pre_mlp_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.43.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.17.mlp.linear_fc1.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.44.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.17.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.18.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.18.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.18.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.18.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.18.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.45.input_layernorm.weight key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.18.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.18.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.45.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.45.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.19.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.45.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.19.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.19.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.45.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.19.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.45.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.45.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.19.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.46.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.19.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.19.mlp.linear_fc2.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.46.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.46.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.20.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.46.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.20.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.20.self_attention.linear_qkv.weight key (1.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.46.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.20.self_attention.linear_qkv.bias key (0.0, 1.0, False, False)_get_param_groups name module.module.decoder.layers.46.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.46.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.20.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.20.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.20.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.21.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.21.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.21.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.21.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.21.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.21.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.final_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.21.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.output_layer.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.22.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.22.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.22.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.22.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.22.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.22.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.22.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.23.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.23.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.23.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.23.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.23.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.23.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.23.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.24.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.24.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.24.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.24.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.24.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.24.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.24.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.25.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.25.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.25.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.25.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.25.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.25.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.25.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.26.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.26.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.26.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.26.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.26.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.26.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.26.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.27.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.27.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.27.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.27.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.27.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.27.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.27.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.28.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.28.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.28.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.28.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.28.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.28.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.28.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.29.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.30.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.30.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.30.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.30.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.30.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.30.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.30.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.31.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.31.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.31.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.31.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.31.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.31.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.31.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.32.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.32.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.32.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.32.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.32.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.32.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.32.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.33.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.33.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.33.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.33.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.33.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.33.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.33.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.34.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.34.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.34.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.34.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.34.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.34.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.34.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.35.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.35.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.35.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.35.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.35.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.35.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.35.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.36.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.36.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.36.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.36.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.36.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.36.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.36.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.37.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.38.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.38.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.38.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.38.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.38.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.38.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.38.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.39.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.39.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.39.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.39.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.39.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.39.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.39.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.40.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.41.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.41.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.41.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.41.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.41.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.41.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.41.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.42.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.43.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.44.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.45.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.45.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.45.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.45.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.45.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.45.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.45.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.46.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.46.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.46.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.46.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.46.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.46.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.46.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.input_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.self_attention.linear_proj.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.self_attention.linear_qkv.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.self_attention.linear_qkv.bias key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.pre_mlp_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.mlp.linear_fc1.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.layers.47.mlp.linear_fc2.weight key (1.0, 1.0, False, False) _get_param_groups name module.module.decoder.final_layernorm.weight key (0.0, 1.0, False, False) _get_param_groups name module.module.output_layer.weight key (1.0, 1.0, False, False) _load_base_checkpoint iteration_load_base_checkpoint iteration_load_base_checkpoint iteration_load_base_checkpoint iteration_load_base_checkpoint iteration_load_base_checkpoint iteration_load_base_checkpoint iteration_load_base_checkpoint iteration _load_base_checkpoint iteration_load_base_checkpoint iteration _load_base_checkpoint iteration_load_base_checkpoint iteration_load_base_checkpoint iteration_load_base_checkpoint iteration 10001000_load_base_checkpoint iteration _load_base_checkpoint iteration_load_base_checkpoint release 10001000 100010001000 10001000 10001000 10001000 1000_load_base_checkpoint release_load_base_checkpoint release_load_base_checkpoint release1000 _load_base_checkpoint release_load_base_checkpoint releaseFalse1000 _load_base_checkpoint release_load_base_checkpoint release_load_base_checkpoint release _load_base_checkpoint release_load_base_checkpoint release_load_base_checkpoint release False _load_base_checkpoint release_load_base_checkpoint release _load_base_checkpoint releaseFalse FalseFalseFalse FalseFalseFalse _load_base_checkpoint releaseFalse FalseFalse False FalseFalse False _load_base_checkpoint /data_2/output/LM/lcvlm_modellink/scripts/qwen25/pretrain_qwen25_14b_intern_300m_ptd_tp8pp1_stage1.sh/20241012_095536/iter_0001000/mp_rank_03/model_optim_rng.pt _load_base_checkpoint /data_2/output/LM/lcvlm_modellink/scripts/qwen25/pretrain_qwen25_14b_intern_300m_ptd_tp8pp1_stage1.sh/20241012_095536/iter_0001000/mp_rank_06/model_optim_rng.pt _load_base_checkpoint /data_2/output/LM/lcvlm_modellink/scripts/qwen25/pretrain_qwen25_14b_intern_300m_ptd_tp8pp1_stage1.sh/20241012_095536/iter_0001000/mp_rank_07/model_optim_rng.pt _load_base_checkpoint_load_base_checkpoint_load_base_checkpoint /data_2/output/LM/lcvlm_modellink/scripts/qwen25/pretrain_qwen25_14b_intern_300m_ptd_tp8pp1_stage1.sh/20241012_095536/iter_0001000/mp_rank_05/model_optim_rng.pt/data_2/output/LM/lcvlm_modellink/scripts/qwen25/pretrain_qwen25_14b_intern_300m_ptd_tp8pp1_stage1.sh/20241012_095536/iter_0001000/mp_rank_00/model_optim_rng.pt/data_2/output/LM/lcvlm_modellink/scripts/qwen25/pretrain_qwen25_14b_intern_300m_ptd_tp8pp1_stage1.sh/20241012_095536/iter_0001000/mp_rank_01/model_optim_rng.pt _load_base_checkpoint_load_base_checkpoint /data_2/output/LM/lcvlm_modellink/scripts/qwen25/pretrain_qwen25_14b_intern_300m_ptd_tp8pp1_stage1.sh/20241012_095536/iter_0001000/mp_rank_05/model_optim_rng.pt /data_2/output/LM/lcvlm_modellink/scripts/qwen25/pretrain_qwen25_14b_intern_300m_ptd_tp8pp1_stage1.sh/20241012_095536/iter_0001000/mp_rank_02/model_optim_rng.pt _load_base_checkpoint /data_2/output/LM/lcvlm_modellink/scripts/qwen25/pretrain_qwen25_14b_intern_300m_ptd_tp8pp1_stage1.sh/20241012_095536/iter_0001000/mp_rank_04/model_optim_rng.pt _load_base_checkpoint /data_2/output/LM/lcvlm_modellink/scripts/qwen25/pretrain_qwen25_14b_intern_300m_ptd_tp8pp1_stage1.sh/20241012_095536/iter_0001000/mp_rank_01/model_optim_rng.pt_load_base_checkpoint /data_2/output/LM/lcvlm_modellink/scripts/qwen25/pretrain_qwen25_14b_intern_300m_ptd_tp8pp1_stage1.sh/20241012_095536/iter_0001000/mp_rank_06/model_optim_rng.pt _load_base_checkpoint /data_2/output/LM/lcvlm_modellink/scripts/qwen25/pretrain_qwen25_14b_intern_300m_ptd_tp8pp1_stage1.sh/20241012_095536/iter_0001000/mp_rank_03/model_optim_rng.pt _load_base_checkpoint_load_base_checkpoint /data_2/output/LM/lcvlm_modellink/scripts/qwen25/pretrain_qwen25_14b_intern_300m_ptd_tp8pp1_stage1.sh/20241012_095536/iter_0001000/mp_rank_07/model_optim_rng.pt/data_2/output/LM/lcvlm_modellink/scripts/qwen25/pretrain_qwen25_14b_intern_300m_ptd_tp8pp1_stage1.sh/20241012_095536/iter_0001000/mp_rank_02/model_optim_rng.pt _load_base_checkpoint /data_2/output/LM/lcvlm_modellink/scripts/qwen25/pretrain_qwen25_14b_intern_300m_ptd_tp8pp1_stage1.sh/20241012_095536/iter_0001000/mp_rank_00/model_optim_rng.pt _load_base_checkpoint /data_2/output/LM/lcvlm_modellink/scripts/qwen25/pretrain_qwen25_14b_intern_300m_ptd_tp8pp1_stage1.sh/20241012_095536/iter_0001000/mp_rank_04/model_optim_rng.pt load_checkpoint iteration 0 load_checkpoint release False strict True load_checkpoint iteration 0 load_checkpoint release False strict True load_checkpoint iteration 0 load_checkpoint release False strict True load_checkpoint iteration 0 load_checkpoint release False strict True load_checkpoint iteration 0 load_checkpoint release False strict True load_checkpoint iteration 0 load_checkpoint release False strict True load_checkpoint iteration 0 load_checkpoint release False strict True load_checkpoint iteration 0 load_checkpoint release False strict True load_checkpoint iteration 0 load_checkpoint release False strict True load_checkpoint iteration 0 load_checkpoint release False strict True load_checkpoint iteration 0 load_checkpoint release False strict True load_checkpoint iteration 0 load_checkpoint release False strict True load_checkpoint iteration 0 load_checkpoint release False strict True load_checkpoint iteration 0 load_checkpoint release False strict True load_checkpoint iteration 0 load_checkpoint release False strict True load_checkpoint iteration 0 load_checkpoint release False strict True local_disk/cognitron_vl/third_party/Megatron-LM_core_r0.6.0/megatron/core/timers.py:238: UserWarning: AutoNonVariableTypeMode is deprecated and will be removed in 1.10 release. For kernel implementations please use AutoDispatchBelowADInplaceOrView instead, If you are looking for a user facing API to enable running your inference-only workload, please use c10::InferenceMode. Using AutoDispatchBelowADInplaceOrView in user code is under risk of producing silent wrong result in some edge cases. See Note [AutoDispatchBelowAutograd] for more details. (Triggered internally at torch_npu/csrc/aten/common/TensorFactories.cpp:74.) rank_name_to_time[rank, i] = self._timers[name].elapsed(reset=reset) local_disk/cognitron_vl/third_party/Megatron-LM_core_r0.6.0/megatron/core/timers.py:238: UserWarning: AutoNonVariableTypeMode is deprecated and will be removed in 1.10 release. For kernel implementations please use AutoDispatchBelowADInplaceOrView instead, If you are looking for a user facing API to enable running your inference-only workload, please use c10::InferenceMode. Using AutoDispatchBelowADInplaceOrView in user code is under risk of producing silent wrong result in some edge cases. See Note [AutoDispatchBelowAutograd] for more details. (Triggered internally at torch_npu/csrc/aten/common/TensorFactories.cpp:74.) rank_name_to_time[rank, i] = self._timers[name].elapsed(reset=reset) local_disk/cognitron_vl/third_party/Megatron-LM_core_r0.6.0/megatron/core/timers.py:238: UserWarning: AutoNonVariableTypeMode is deprecated and will be removed in 1.10 release. For kernel implementations please use AutoDispatchBelowADInplaceOrView instead, If you are looking for a user facing API to enable running your inference-only workload, please use c10::InferenceMode. Using AutoDispatchBelowADInplaceOrView in user code is under risk of producing silent wrong result in some edge cases. See Note [AutoDispatchBelowAutograd] for more details. (Triggered internally at torch_npu/csrc/aten/common/TensorFactories.cpp:74.) rank_name_to_time[rank, i] = self._timers[name].elapsed(reset=reset) local_disk/cognitron_vl/third_party/Megatron-LM_core_r0.6.0/megatron/core/timers.py:238: UserWarning: AutoNonVariableTypeMode is deprecated and will be removed in 1.10 release. For kernel implementations please use AutoDispatchBelowADInplaceOrView instead, If you are looking for a user facing API to enable running your inference-only workload, please use c10::InferenceMode. Using AutoDispatchBelowADInplaceOrView in user code is under risk of producing silent wrong result in some edge cases. See Note [AutoDispatchBelowAutograd] for more details. (Triggered internally at torch_npu/csrc/aten/common/TensorFactories.cpp:74.) rank_name_to_time[rank, i] = self._timers[name].elapsed(reset=reset) local_disk/cognitron_vl/third_party/Megatron-LM_core_r0.6.0/megatron/core/timers.py:238: UserWarning: AutoNonVariableTypeMode is deprecated and will be removed in 1.10 release. For kernel implementations please use AutoDispatchBelowADInplaceOrView instead, If you are looking for a user facing API to enable running your inference-only workload, please use c10::InferenceMode. Using AutoDispatchBelowADInplaceOrView in user code is under risk of producing silent wrong result in some edge cases. See Note [AutoDispatchBelowAutograd] for more details. (Triggered internally at torch_npu/csrc/aten/common/TensorFactories.cpp:74.) rank_name_to_time[rank, i] = self._timers[name].elapsed(reset=reset) local_disk/cognitron_vl/third_party/Megatron-LM_core_r0.6.0/megatron/core/timers.py:238: UserWarning: AutoNonVariableTypeMode is deprecated and will be removed in 1.10 release. For kernel implementations please use AutoDispatchBelowADInplaceOrView instead, If you are looking for a user facing API to enable running your inference-only workload, please use c10::InferenceMode. Using AutoDispatchBelowADInplaceOrView in user code is under risk of producing silent wrong result in some edge cases. See Note [AutoDispatchBelowAutograd] for more details. (Triggered internally at torch_npu/csrc/aten/common/TensorFactories.cpp:74.) rank_name_to_time[rank, i] = self._timers[name].elapsed(reset=reset) local_disk/cognitron_vl/third_party/Megatron-LM_core_r0.6.0/megatron/core/timers.py:238: UserWarning: AutoNonVariableTypeMode is deprecated and will be removed in 1.10 release. For kernel implementations please use AutoDispatchBelowADInplaceOrView instead, If you are looking for a user facing API to enable running your inference-only workload, please use c10::InferenceMode. Using AutoDispatchBelowADInplaceOrView in user code is under risk of producing silent wrong result in some edge cases. See Note [AutoDispatchBelowAutograd] for more details. (Triggered internally at torch_npu/csrc/aten/common/TensorFactories.cpp:74.) rank_name_to_time[rank, i] = self._timers[name].elapsed(reset=reset) local_disk/cognitron_vl/third_party/Megatron-LM_core_r0.6.0/megatron/core/timers.py:238: UserWarning: AutoNonVariableTypeMode is deprecated and will be removed in 1.10 release. For kernel implementations please use AutoDispatchBelowADInplaceOrView instead, If you are looking for a user facing API to enable running your inference-only workload, please use c10::InferenceMode. Using AutoDispatchBelowADInplaceOrView in user code is under risk of producing silent wrong result in some edge cases. See Note [AutoDispatchBelowAutograd] for more details. (Triggered internally at torch_npu/csrc/aten/common/TensorFactories.cpp:74.) rank_name_to_time[rank, i] = self._timers[name].elapsed(reset=reset) local_disk/cognitron_vl/third_party/Megatron-LM_core_r0.6.0/megatron/core/timers.py:238: UserWarning: AutoNonVariableTypeMode is deprecated and will be removed in 1.10 release. For kernel implementations please use AutoDispatchBelowADInplaceOrView instead, If you are looking for a user facing API to enable running your inference-only workload, please use c10::InferenceMode. Using AutoDispatchBelowADInplaceOrView in user code is under risk of producing silent wrong result in some edge cases. See Note [AutoDispatchBelowAutograd] for more details. (Triggered internally at torch_npu/csrc/aten/common/TensorFactories.cpp:74.) rank_name_to_time[rank, i] = self._timers[name].elapsed(reset=reset) local_disk/cognitron_vl/third_party/Megatron-LM_core_r0.6.0/megatron/core/timers.py:238: UserWarning: AutoNonVariableTypeMode is deprecated and will be removed in 1.10 release. For kernel implementations please use AutoDispatchBelowADInplaceOrView instead, If you are looking for a user facing API to enable running your inference-only workload, please use c10::InferenceMode. Using AutoDispatchBelowADInplaceOrView in user code is under risk of producing silent wrong result in some edge cases. See Note [AutoDispatchBelowAutograd] for more details. (Triggered internally at torch_npu/csrc/aten/common/TensorFactories.cpp:74.) rank_name_to_time[rank, i] = self._timers[name].elapsed(reset=reset) local_disk/cognitron_vl/third_party/Megatron-LM_core_r0.6.0/megatron/core/timers.py:238: UserWarning: AutoNonVariableTypeMode is deprecated and will be removed in 1.10 release. For kernel implementations please use AutoDispatchBelowADInplaceOrView instead, If you are looking for a user facing API to enable running your inference-only workload, please use c10::InferenceMode. Using AutoDispatchBelowADInplaceOrView in user code is under risk of producing silent wrong result in some edge cases. See Note [AutoDispatchBelowAutograd] for more details. (Triggered internally at torch_npu/csrc/aten/common/TensorFactories.cpp:74.) rank_name_to_time[rank, i] = self._timers[name].elapsed(reset=reset) local_disk/cognitron_vl/third_party/Megatron-LM_core_r0.6.0/megatron/core/timers.py:238: UserWarning: AutoNonVariableTypeMode is deprecated and will be removed in 1.10 release. For kernel implementations please use AutoDispatchBelowADInplaceOrView instead, If you are looking for a user facing API to enable running your inference-only workload, please use c10::InferenceMode. Using AutoDispatchBelowADInplaceOrView in user code is under risk of producing silent wrong result in some edge cases. See Note [AutoDispatchBelowAutograd] for more details. (Triggered internally at torch_npu/csrc/aten/common/TensorFactories.cpp:74.) rank_name_to_time[rank, i] = self._timers[name].elapsed(reset=reset) local_disk/cognitron_vl/third_party/Megatron-LM_core_r0.6.0/megatron/core/timers.py:238: UserWarning: AutoNonVariableTypeMode is deprecated and will be removed in 1.10 release. For kernel implementations please use AutoDispatchBelowADInplaceOrView instead, If you are looking for a user facing API to enable running your inference-only workload, please use c10::InferenceMode. Using AutoDispatchBelowADInplaceOrView in user code is under risk of producing silent wrong result in some edge cases. See Note [AutoDispatchBelowAutograd] for more details. (Triggered internally at torch_npu/csrc/aten/common/TensorFactories.cpp:74.) rank_name_to_time[rank, i] = self._timers[name].elapsed(reset=reset) local_disk/cognitron_vl/third_party/Megatron-LM_core_r0.6.0/megatron/core/timers.py:238: UserWarning: AutoNonVariableTypeMode is deprecated and will be removed in 1.10 release. For kernel implementations please use AutoDispatchBelowADInplaceOrView instead, If you are looking for a user facing API to enable running your inference-only workload, please use c10::InferenceMode. Using AutoDispatchBelowADInplaceOrView in user code is under risk of producing silent wrong result in some edge cases. See Note [AutoDispatchBelowAutograd] for more details. (Triggered internally at torch_npu/csrc/aten/common/TensorFactories.cpp:74.) rank_name_to_time[rank, i] = self._timers[name].elapsed(reset=reset) local_disk/cognitron_vl/third_party/Megatron-LM_core_r0.6.0/megatron/core/timers.py:238: UserWarning: AutoNonVariableTypeMode is deprecated and will be removed in 1.10 release. For kernel implementations please use AutoDispatchBelowADInplaceOrView instead, If you are looking for a user facing API to enable running your inference-only workload, please use c10::InferenceMode. Using AutoDispatchBelowADInplaceOrView in user code is under risk of producing silent wrong result in some edge cases. See Note [AutoDispatchBelowAutograd] for more details. (Triggered internally at torch_npu/csrc/aten/common/TensorFactories.cpp:74.) rank_name_to_time[rank, i] = self._timers[name].elapsed(reset=reset) local_disk/cognitron_vl/third_party/Megatron-LM_core_r0.6.0/megatron/core/timers.py:238: UserWarning: AutoNonVariableTypeMode is deprecated and will be removed in 1.10 release. For kernel implementations please use AutoDispatchBelowADInplaceOrView instead, If you are looking for a user facing API to enable running your inference-only workload, please use c10::InferenceMode. Using AutoDispatchBelowADInplaceOrView in user code is under risk of producing silent wrong result in some edge cases. See Note [AutoDispatchBelowAutograd] for more details. (Triggered internally at torch_npu/csrc/aten/common/TensorFactories.cpp:74.) rank_name_to_time[rank, i] = self._timers[name].elapsed(reset=reset) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/distributed_c10d.py:2927: UserWarning: torch.distributed._all_gather_base is a private function and will be deprecated. Please use torch.distributed.all_gather_into_tensor instead. warnings.warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/distributed_c10d.py:2927: UserWarning: torch.distributed._all_gather_base is a private function and will be deprecated. Please use torch.distributed.all_gather_into_tensor instead. warnings.warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/distributed_c10d.py:2927: UserWarning: torch.distributed._all_gather_base is a private function and will be deprecated. Please use torch.distributed.all_gather_into_tensor instead. warnings.warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/distributed_c10d.py:2927: UserWarning: torch.distributed._all_gather_base is a private function and will be deprecated. Please use torch.distributed.all_gather_into_tensor instead. warnings.warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/distributed_c10d.py:2927: UserWarning: torch.distributed._all_gather_base is a private function and will be deprecated. Please use torch.distributed.all_gather_into_tensor instead. warnings.warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/distributed_c10d.py:2927: UserWarning: torch.distributed._all_gather_base is a private function and will be deprecated. Please use torch.distributed.all_gather_into_tensor instead. warnings.warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/distributed_c10d.py:2927: UserWarning: torch.distributed._all_gather_base is a private function and will be deprecated. Please use torch.distributed.all_gather_into_tensor instead. warnings.warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/distributed_c10d.py:2927: UserWarning: torch.distributed._all_gather_base is a private function and will be deprecated. Please use torch.distributed.all_gather_into_tensor instead. warnings.warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/distributed_c10d.py:2927: UserWarning: torch.distributed._all_gather_base is a private function and will be deprecated. Please use torch.distributed.all_gather_into_tensor instead. warnings.warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/distributed_c10d.py:2927: UserWarning: torch.distributed._all_gather_base is a private function and will be deprecated. Please use torch.distributed.all_gather_into_tensor instead. warnings.warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/distributed_c10d.py:2927: UserWarning: torch.distributed._all_gather_base is a private function and will be deprecated. Please use torch.distributed.all_gather_into_tensor instead. warnings.warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/distributed_c10d.py:2927: UserWarning: torch.distributed._all_gather_base is a private function and will be deprecated. Please use torch.distributed.all_gather_into_tensor instead. warnings.warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/distributed_c10d.py:2927: UserWarning: torch.distributed._all_gather_base is a private function and will be deprecated. Please use torch.distributed.all_gather_into_tensor instead. warnings.warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/distributed_c10d.py:2927: UserWarning: torch.distributed._all_gather_base is a private function and will be deprecated. Please use torch.distributed.all_gather_into_tensor instead. warnings.warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/distributed_c10d.py:2927: UserWarning: torch.distributed._all_gather_base is a private function and will be deprecated. Please use torch.distributed.all_gather_into_tensor instead. warnings.warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/distributed_c10d.py:2927: UserWarning: torch.distributed._all_gather_base is a private function and will be deprecated. Please use torch.distributed.all_gather_into_tensor instead. warnings.warn( > rank 153 does not create GPT datasets ... > rank 146 does not create GPT datasets ... > rank 147 does not create GPT datasets ... > rank 157 does not create GPT datasets ... > rank 152 is creating GPT datasets ... > rank 145 does not create GPT datasets ... > rank 150 does not create GPT datasets ... > rank 154 does not create GPT datasets ... > rank 155 does not create GPT datasets ... > rank 156 does not create GPT datasets ... > rank 159 does not create GPT datasets ... > rank 151 does not create GPT datasets ... > rank 149 does not create GPT datasets ... > rank 144 is creating GPT datasets ... > rank 158 does not create GPT datasets ... > rank 148 does not create GPT datasets ... target_ratios [(1, 1), (1, 2), (2, 1), (3, 1), (1, 3), (2, 2), (4, 1), (1, 4), (5, 1), (1, 5), (1, 6), (6, 1), (3, 2), (2, 3), (7, 1), (1, 7), (4, 2), (2, 4), (1, 8), (8, 1), (1, 9), (3, 3), (9, 1), (2, 5), (5, 2), (10, 1), (1, 10), (11, 1), (1, 11), (12, 1), (3, 4), (4, 3), (1, 12), (6, 2), (2, 6)] possible_resolutions [[448, 448], [448, 896], [896, 448], [1344, 448], [448, 1344], [896, 896], [1792, 448], [448, 1792], [2240, 448], [448, 2240], [448, 2688], [2688, 448], [1344, 896], [896, 1344], [3136, 448], [448, 3136], [1792, 896], [896, 1792], [448, 3584], [3584, 448], [448, 4032], [1344, 1344], [4032, 448], [896, 2240], [2240, 896], [4480, 448], [448, 4480], [4928, 448], [448, 4928], [5376, 448], [1344, 1792], [1792, 1344], [448, 5376], [2688, 896], [896, 2688]] target_ratios [(1, 1), (1, 2), (2, 1), (3, 1), (1, 3), (2, 2), (4, 1), (1, 4), (5, 1), (1, 5), (1, 6), (6, 1), (3, 2), (2, 3), (7, 1), (1, 7), (4, 2), (2, 4), (1, 8), (8, 1), (1, 9), (3, 3), (9, 1), (2, 5), (5, 2), (10, 1), (1, 10), (11, 1), (1, 11), (12, 1), (3, 4), (4, 3), (1, 12), (6, 2), (2, 6)] possible_resolutions [[448, 448], [448, 896], [896, 448], [1344, 448], [448, 1344], [896, 896], [1792, 448], [448, 1792], [2240, 448], [448, 2240], [448, 2688], [2688, 448], [1344, 896], [896, 1344], [3136, 448], [448, 3136], [1792, 896], [896, 1792], [448, 3584], [3584, 448], [448, 4032], [1344, 1344], [4032, 448], [896, 2240], [2240, 896], [4480, 448], [448, 4480], [4928, 448], [448, 4928], [5376, 448], [1344, 1792], [1792, 1344], [448, 5376], [2688, 896], [896, 2688]] /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch_npu/utils/storage.py:38: UserWarning: TypedStorage is deprecated. It will be removed in the future and UntypedStorage will be the only storage class. This should only matter to you if you are using storages directly. To access UntypedStorage directly, use tensor.untyped_storage() instead of tensor.storage() if self.device.type != 'cpu': /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch_npu/utils/storage.py:38: UserWarning: TypedStorage is deprecated. It will be removed in the future and UntypedStorage will be the only storage class. This should only matter to you if you are using storages directly. To access UntypedStorage directly, use tensor.untyped_storage() instead of tensor.storage() if self.device.type != 'cpu': /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch_npu/utils/storage.py:38: UserWarning: TypedStorage is deprecated. It will be removed in the future and UntypedStorage will be the only storage class. This should only matter to you if you are using storages directly. To access UntypedStorage directly, use tensor.untyped_storage() instead of tensor.storage() if self.device.type != 'cpu': Warning: Device do not support double dtype now, dtype cast repalce with float. Warning: Device do not support double dtype now, dtype cast repalce with float. Warning: Device do not support double dtype now, dtype cast repalce with float. Warning: Device do not support double dtype now, dtype cast repalce with float. Warning: Device do not support double dtype now, dtype cast repalce with float. Warning: Device do not support double dtype now, dtype cast repalce with float. Warning: Device do not support double dtype now, dtype cast repalce with float. Warning: Device do not support double dtype now, dtype cast repalce with float. Warning: Device do not support double dtype now, dtype cast repalce with float. Warning: Device do not support double dtype now, dtype cast repalce with float. Warning: Device do not support double dtype now, dtype cast repalce with float. Warning: Device do not support double dtype now, dtype cast repalce with float. Warning: Device do not support double dtype now, dtype cast repalce with float. Warning: Device do not support double dtype now, dtype cast repalce with float. Warning: Device do not support double dtype now, dtype cast repalce with float. Warning: Device do not support double dtype now, dtype cast repalce with float. /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/distributed_c10d.py:2927: UserWarning: torch.distributed._all_gather_base is a private function and will be deprecated. Please use torch.distributed.all_gather_into_tensor instead. warnings.warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/distributed_c10d.py:3403: UserWarning: torch.distributed._reduce_scatter_base is a private function and will be deprecated. Please use torch.distributed.reduce_scatter_tensor instead. warnings.warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/distributed_c10d.py:2927: UserWarning: torch.distributed._all_gather_base is a private function and will be deprecated. Please use torch.distributed.all_gather_into_tensor instead. warnings.warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/distributed_c10d.py:3403: UserWarning: torch.distributed._reduce_scatter_base is a private function and will be deprecated. Please use torch.distributed.reduce_scatter_tensor instead. warnings.warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/distributed_c10d.py:2927: UserWarning: torch.distributed._all_gather_base is a private function and will be deprecated. Please use torch.distributed.all_gather_into_tensor instead. warnings.warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/distributed_c10d.py:3403: UserWarning: torch.distributed._reduce_scatter_base is a private function and will be deprecated. Please use torch.distributed.reduce_scatter_tensor instead. warnings.warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/distributed_c10d.py:2927: UserWarning: torch.distributed._all_gather_base is a private function and will be deprecated. Please use torch.distributed.all_gather_into_tensor instead. warnings.warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/distributed_c10d.py:2927: UserWarning: torch.distributed._all_gather_base is a private function and will be deprecated. Please use torch.distributed.all_gather_into_tensor instead. warnings.warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/distributed_c10d.py:3403: UserWarning: torch.distributed._reduce_scatter_base is a private function and will be deprecated. Please use torch.distributed.reduce_scatter_tensor instead. warnings.warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/distributed_c10d.py:2927: UserWarning: torch.distributed._all_gather_base is a private function and will be deprecated. Please use torch.distributed.all_gather_into_tensor instead. warnings.warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/distributed_c10d.py:2927: UserWarning: torch.distributed._all_gather_base is a private function and will be deprecated. Please use torch.distributed.all_gather_into_tensor instead. warnings.warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/distributed_c10d.py:3403: UserWarning: torch.distributed._reduce_scatter_base is a private function and will be deprecated. Please use torch.distributed.reduce_scatter_tensor instead. warnings.warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/distributed_c10d.py:3403: UserWarning: torch.distributed._reduce_scatter_base is a private function and will be deprecated. Please use torch.distributed.reduce_scatter_tensor instead. warnings.warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/distributed_c10d.py:3403: UserWarning: torch.distributed._reduce_scatter_base is a private function and will be deprecated. Please use torch.distributed.reduce_scatter_tensor instead. warnings.warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/distributed_c10d.py:2927: UserWarning: torch.distributed._all_gather_base is a private function and will be deprecated. Please use torch.distributed.all_gather_into_tensor instead. warnings.warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/distributed_c10d.py:3403: UserWarning: torch.distributed._reduce_scatter_base is a private function and will be deprecated. Please use torch.distributed.reduce_scatter_tensor instead. warnings.warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/distributed_c10d.py:2927: UserWarning: torch.distributed._all_gather_base is a private function and will be deprecated. Please use torch.distributed.all_gather_into_tensor instead. warnings.warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/distributed_c10d.py:3403: UserWarning: torch.distributed._reduce_scatter_base is a private function and will be deprecated. Please use torch.distributed.reduce_scatter_tensor instead. warnings.warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/distributed_c10d.py:2927: UserWarning: torch.distributed._all_gather_base is a private function and will be deprecated. Please use torch.distributed.all_gather_into_tensor instead. warnings.warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/distributed_c10d.py:2927: UserWarning: torch.distributed._all_gather_base is a private function and will be deprecated. Please use torch.distributed.all_gather_into_tensor instead. warnings.warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/distributed_c10d.py:2927: UserWarning: torch.distributed._all_gather_base is a private function and will be deprecated. Please use torch.distributed.all_gather_into_tensor instead. warnings.warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/distributed_c10d.py:2927: UserWarning: torch.distributed._all_gather_base is a private function and will be deprecated. Please use torch.distributed.all_gather_into_tensor instead. warnings.warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/distributed_c10d.py:3403: UserWarning: torch.distributed._reduce_scatter_base is a private function and will be deprecated. Please use torch.distributed.reduce_scatter_tensor instead. warnings.warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/distributed_c10d.py:3403: UserWarning: torch.distributed._reduce_scatter_base is a private function and will be deprecated. Please use torch.distributed.reduce_scatter_tensor instead. warnings.warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/distributed_c10d.py:3403: UserWarning: torch.distributed._reduce_scatter_base is a private function and will be deprecated. Please use torch.distributed.reduce_scatter_tensor instead. warnings.warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/distributed_c10d.py:2927: UserWarning: torch.distributed._all_gather_base is a private function and will be deprecated. Please use torch.distributed.all_gather_into_tensor instead. warnings.warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/distributed_c10d.py:2927: UserWarning: torch.distributed._all_gather_base is a private function and will be deprecated. Please use torch.distributed.all_gather_into_tensor instead. warnings.warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/distributed_c10d.py:3403: UserWarning: torch.distributed._reduce_scatter_base is a private function and will be deprecated. Please use torch.distributed.reduce_scatter_tensor instead. warnings.warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/distributed_c10d.py:3403: UserWarning: torch.distributed._reduce_scatter_base is a private function and will be deprecated. Please use torch.distributed.reduce_scatter_tensor instead. warnings.warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/distributed_c10d.py:3403: UserWarning: torch.distributed._reduce_scatter_base is a private function and will be deprecated. Please use torch.distributed.reduce_scatter_tensor instead. warnings.warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/distributed_c10d.py:2927: UserWarning: torch.distributed._all_gather_base is a private function and will be deprecated. Please use torch.distributed.all_gather_into_tensor instead. warnings.warn( /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/distributed_c10d.py:3403: UserWarning: torch.distributed._reduce_scatter_base is a private function and will be deprecated. Please use torch.distributed.reduce_scatter_tensor instead. warnings.warn( - - - - - - - - - - - - - - - - \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ | | | | | | | | | | | | | | | | / / / / / / / / / / / / / / / / /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch_npu/utils/storage.py:38: UserWarning: TypedStorage is deprecated. It will be removed in the future and UntypedStorage will be the only storage class. This should only matter to you if you are using storages directly. To access UntypedStorage directly, use tensor.untyped_storage() instead of tensor.storage() if self.device.type != 'cpu': - - - - - - - - - - - - - - - - /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch_npu/utils/storage.py:38: UserWarning: TypedStorage is deprecated. It will be removed in the future and UntypedStorage will be the only storage class. This should only matter to you if you are using storages directly. To access UntypedStorage directly, use tensor.untyped_storage() instead of tensor.storage() if self.device.type != 'cpu': /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch_npu/utils/storage.py:38: UserWarning: TypedStorage is deprecated. It will be removed in the future and UntypedStorage will be the only storage class. This should only matter to you if you are using storages directly. To access UntypedStorage directly, use tensor.untyped_storage() instead of tensor.storage() if self.device.type != 'cpu': /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch_npu/utils/storage.py:38: UserWarning: TypedStorage is deprecated. It will be removed in the future and UntypedStorage will be the only storage class. This should only matter to you if you are using storages directly. To access UntypedStorage directly, use tensor.untyped_storage() instead of tensor.storage() if self.device.type != 'cpu': /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch_npu/utils/storage.py:38: UserWarning: TypedStorage is deprecated. It will be removed in the future and UntypedStorage will be the only storage class. This should only matter to you if you are using storages directly. To access UntypedStorage directly, use tensor.untyped_storage() instead of tensor.storage() if self.device.type != 'cpu': /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch_npu/utils/storage.py:38: UserWarning: TypedStorage is deprecated. It will be removed in the future and UntypedStorage will be the only storage class. This should only matter to you if you are using storages directly. To access UntypedStorage directly, use tensor.untyped_storage() instead of tensor.storage() if self.device.type != 'cpu': /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch_npu/utils/storage.py:38: UserWarning: TypedStorage is deprecated. It will be removed in the future and UntypedStorage will be the only storage class. This should only matter to you if you are using storages directly. To access UntypedStorage directly, use tensor.untyped_storage() instead of tensor.storage() if self.device.type != 'cpu': /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch_npu/utils/storage.py:38: UserWarning: TypedStorage is deprecated. It will be removed in the future and UntypedStorage will be the only storage class. This should only matter to you if you are using storages directly. To access UntypedStorage directly, use tensor.untyped_storage() instead of tensor.storage() if self.device.type != 'cpu': /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch_npu/utils/storage.py:38: UserWarning: TypedStorage is deprecated. It will be removed in the future and UntypedStorage will be the only storage class. This should only matter to you if you are using storages directly. To access UntypedStorage directly, use tensor.untyped_storage() instead of tensor.storage() if self.device.type != 'cpu': /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch_npu/utils/storage.py:38: UserWarning: TypedStorage is deprecated. It will be removed in the future and UntypedStorage will be the only storage class. This should only matter to you if you are using storages directly. To access UntypedStorage directly, use tensor.untyped_storage() instead of tensor.storage() if self.device.type != 'cpu': /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch_npu/utils/storage.py:38: UserWarning: TypedStorage is deprecated. It will be removed in the future and UntypedStorage will be the only storage class. This should only matter to you if you are using storages directly. To access UntypedStorage directly, use tensor.untyped_storage() instead of tensor.storage() if self.device.type != 'cpu': /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch_npu/utils/storage.py:38: UserWarning: TypedStorage is deprecated. It will be removed in the future and UntypedStorage will be the only storage class. This should only matter to you if you are using storages directly. To access UntypedStorage directly, use tensor.untyped_storage() instead of tensor.storage() if self.device.type != 'cpu': /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch_npu/utils/storage.py:38: UserWarning: TypedStorage is deprecated. It will be removed in the future and UntypedStorage will be the only storage class. This should only matter to you if you are using storages directly. To access UntypedStorage directly, use tensor.untyped_storage() instead of tensor.storage() if self.device.type != 'cpu': \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ \ Token indices sequence length is longer than the specified maximum sequence length for this model (87438 > 16384). Running this sequence through the model will result in indexing errors Token indices sequence length is longer than the specified maximum sequence length for this model (30016 > 16384). Running this sequence through the model will result in indexing errors Token indices sequence length is longer than the specified maximum sequence length for this model (26200 > 16384). Running this sequence through the model will result in indexing errors Token indices sequence length is longer than the specified maximum sequence length for this model (19703 > 16384). Running this sequence through the model will result in indexing errors local_disk/cognitron_vl/cognitron_vl/data/processor/image_processor.py:240: ResourceWarning: unclosed file <_io.BufferedReader name='datasets/LMM/lmms-lab/LLaVA-OneVision-Data/cambrian(filtered)/cambrian_selection/web-landmark_images_Golden_Temple.jpg'> image = Image.open(img_or_path).convert("RGB") ResourceWarning: Enable tracemalloc to get the object allocation traceback processed_samples 10195 unjoint_samples 10000 processed_samples 10197 unjoint_samples 10000 processed_samples 10201 unjoint_samples 10000 processed_samples 10219 unjoint_samples 10000 processed_samples 10222 unjoint_samples 10000 processed_samples 10225 unjoint_samples 10000 processed_samples 10228 unjoint_samples 10000 processed_samples 10234 unjoint_samples 10000 processed_samples 10164 unjoint_samples 10000 processed_samples 10197 unjoint_samples 10000 processed_samples 10206 unjoint_samples 10000 processed_samples 10212 unjoint_samples 10000 processed_samples 10222 unjoint_samples 10000 processed_samples 10225 unjoint_samples 10000 processed_samples 10224 unjoint_samples 10000 processed_samples 10239 unjoint_samples 10000 local_disk/cognitron_vl/cognitron_vl/data/processor/image_processor.py:240: ResourceWarning: unclosed file <_io.BufferedReader name='datasets/LMM/lmms-lab/LLaVA-OneVision-Data/cambrian(filtered)/cambrian_selection/web-landmark_images_Golden_Temple.jpg'> image = Image.open(img_or_path).convert("RGB") ResourceWarning: Enable tracemalloc to get the object allocation traceback Token indices sequence length is longer than the specified maximum sequence length for this model (84959 > 16384). Running this sequence through the model will result in indexing errors local_disk/cognitron_vl/cognitron_vl/data/processor/image_processor.py:240: ResourceWarning: unclosed file <_io.BufferedReader name='datasets/LMM/lmms-lab/M4-Instruct-Data/mmchat/images/mw2048_7d6c8b50ly1fgwo1va92zj20hs1827ie.jpg'> image = Image.open(img_or_path).convert("RGB") ResourceWarning: Enable tracemalloc to get the object allocation traceback local_disk/cognitron_vl/cognitron_vl/data/processor/image_processor.py:240: ResourceWarning: unclosed file <_io.BufferedReader name='datasets/LMM/lmms-lab/M4-Instruct-Data/imagecode/0.0.0/c55fcb268ead378049e4743c77ca2db3142e12a0f7dfc42eb8267e08efa85f58/train_images/image-sets/open-images-1858_b25543cdaa25a08a/img4.jpg'> image = Image.open(img_or_path).convert("RGB") ResourceWarning: Enable tracemalloc to get the object allocation traceback /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/PIL/TiffImagePlugin.py:870: UserWarning: Truncated File Read warnings.warn(str(msg)) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/PIL/TiffImagePlugin.py:870: UserWarning: Truncated File Read warnings.warn(str(msg)) processed_samples 20392 unjoint_samples 20000 processed_samples 20398 unjoint_samples 20000 processed_samples 20412 unjoint_samples 20000 processed_samples 20421 unjoint_samples 20000 processed_samples 20427 unjoint_samples 20000 processed_samples 20440 unjoint_samples 20000 processed_samples 20440 unjoint_samples 20000 processed_samples 20443 unjoint_samples 20000 processed_samples 20364 unjoint_samples 20000 processed_samples 20395 unjoint_samples 20000 processed_samples 20413 unjoint_samples 20000 processed_samples 20418 unjoint_samples 20000 processed_samples 20423 unjoint_samples 20000 processed_samples 20430 unjoint_samples 20000 processed_samples 20439 unjoint_samples 20000 processed_samples 20447 unjoint_samples 20000 Token indices sequence length is longer than the specified maximum sequence length for this model (36865 > 16384). Running this sequence through the model will result in indexing errors local_disk/cognitron_vl/cognitron_vl/data/processor/image_processor.py:240: ResourceWarning: unclosed file <_io.BufferedReader name='datasets/LMM/lmms-lab/M4-Instruct-Data/IEdit/full/images/6981.jpg'> image = Image.open(img_or_path).convert("RGB") ResourceWarning: Enable tracemalloc to get the object allocation traceback Token indices sequence length is longer than the specified maximum sequence length for this model (16395 > 16384). Running this sequence through the model will result in indexing errors local_disk/cognitron_vl/cognitron_vl/data/processor/image_processor.py:240: ResourceWarning: unclosed file <_io.BufferedReader name='datasets/LMM/Vision-Flan/vision-flan_191-task_1k/images_191task_1k/WIT+detailed_description_146_Vernonia_amygdalina_06.jpg'> image = Image.open(img_or_path).convert("RGB") ResourceWarning: Enable tracemalloc to get the object allocation traceback local_disk/cognitron_vl/cognitron_vl/data/processor/image_processor.py:240: ResourceWarning: unclosed file <_io.BufferedReader name='datasets/LMM/Vision-Flan/vision-flan_191-task_1k/images_191task_1k/WIT+detailed_description_265_9WymanWorcesterFront.JPG'> image = Image.open(img_or_path).convert("RGB") ResourceWarning: Enable tracemalloc to get the object allocation traceback processed_samples 30599 unjoint_samples 30000 processed_samples 30620 unjoint_samples 30000 processed_samples 30623 unjoint_samples 30000 processed_samples 30623 unjoint_samples 30000 processed_samples 30625 unjoint_samples 30000 processed_samples 30643 unjoint_samples 30000 processed_samples 30670 unjoint_samples 30000 processed_samples 30670 unjoint_samples 30000 processed_samples 30577 unjoint_samples 30000 processed_samples 30597 unjoint_samples 30000 processed_samples 30598 unjoint_samples 30000 processed_samples 30606 unjoint_samples 30000 processed_samples 30632 unjoint_samples 30000 processed_samples 30635 unjoint_samples 30000 processed_samples 30665 unjoint_samples 30000 processed_samples 30695 unjoint_samples 30000 /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/PIL/TiffImagePlugin.py:870: UserWarning: Corrupt EXIF data. Expecting to read 4 bytes but only got 0. warnings.warn(str(msg)) /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/PIL/TiffImagePlugin.py:870: UserWarning: Truncated File Read warnings.warn(str(msg)) Token indices sequence length is longer than the specified maximum sequence length for this model (329688 > 16384). Running this sequence through the model will result in indexing errors processed_samples 40810 unjoint_samples 40000 processed_samples 40832 unjoint_samples 40000 processed_samples 40838 unjoint_samples 40000 processed_samples 40839 unjoint_samples 40000 processed_samples 40845 unjoint_samples 40000 processed_samples 40852 unjoint_samples 40000 processed_samples 40882 unjoint_samples 40000 processed_samples 40894 unjoint_samples 40000 processed_samples 40779 unjoint_samples 40000 processed_samples 40785 unjoint_samples 40000 processed_samples 40805 unjoint_samples 40000 processed_samples 40809 unjoint_samples 40000 processed_samples 40837 unjoint_samples 40000 processed_samples 40845 unjoint_samples 40000 processed_samples 40876 unjoint_samples 40000 processed_samples 40895 unjoint_samples 40000 local_disk/cognitron_vl/cognitron_vl/data/processor/image_processor.py:240: ResourceWarning: unclosed file <_io.BufferedReader name='datasets/LMM/lmms-lab/LLaVA-OneVision-Mid-Data/ureader-instruction-1.0/TextCaps/train_images/21d60e0822064acb.jpg'> image = Image.open(img_or_path).convert("RGB") ResourceWarning: Enable tracemalloc to get the object allocation traceback local_disk/cognitron_vl/cognitron_vl/data/processor/image_processor.py:240: ResourceWarning: unclosed file <_io.BufferedReader name='datasets/LMM/lmms-lab/M4-Instruct-Data/mmchat/images/mw2048_6f89c732gy1ff360nro89j20hs160ae9.jpg'> image = Image.open(img_or_path).convert("RGB") ResourceWarning: Enable tracemalloc to get the object allocation traceback local_disk/cognitron_vl/cognitron_vl/data/processor/image_processor.py:240: ResourceWarning: unclosed file <_io.BufferedReader name='datasets/LMM/lmms-lab/M4-Instruct-Data/mmchat/images/mw2048_6f89c732gy1ff360o7hp0j20go0b4ab6.jpg'> image = Image.open(img_or_path).convert("RGB") ResourceWarning: Enable tracemalloc to get the object allocation traceback Token indices sequence length is longer than the specified maximum sequence length for this model (21141 > 16384). Running this sequence through the model will result in indexing errors processed_samples 51014 unjoint_samples 50000 processed_samples 51021 unjoint_samples 50000 processed_samples 51031 unjoint_samples 50000 processed_samples 51065 unjoint_samples 50000 processed_samples 51069 unjoint_samples 50000 processed_samples 51081 unjoint_samples 50000 processed_samples 51086 unjoint_samples 50000 processed_samples 50982 unjoint_samples 50000 processed_samples 50994 unjoint_samples 50000 processed_samples 51128 unjoint_samples 50000 processed_samples 51012 unjoint_samples 50000 processed_samples 51017 unjoint_samples 50000 processed_samples 51023 unjoint_samples 50000 processed_samples 51066 unjoint_samples 50000 processed_samples 51093 unjoint_samples 50000 processed_samples 51099 unjoint_samples 50000 Token indices sequence length is longer than the specified maximum sequence length for this model (469971 > 16384). Running this sequence through the model will result in indexing errors local_disk/cognitron_vl/cognitron_vl/data/processor/image_processor.py:240: ResourceWarning: unclosed file <_io.BufferedReader name='datasets/LMM/lmms-lab/M4-Instruct-Data/OCR-VQA/full/images/358.jpg'> image = Image.open(img_or_path).convert("RGB") ResourceWarning: Enable tracemalloc to get the object allocation traceback Token indices sequence length is longer than the specified maximum sequence length for this model (120348 > 16384). Running this sequence through the model will result in indexing errors processed_samples 61209 unjoint_samples 60000 processed_samples 61222 unjoint_samples 60000 processed_samples 61238 unjoint_samples 60000 processed_samples 61239 unjoint_samples 60000 processed_samples 61274 unjoint_samples 60000 processed_samples 61283 unjoint_samples 60000 processed_samples 61292 unjoint_samples 60000 processed_samples 61382 unjoint_samples 60000 processed_samples 61215 unjoint_samples 60000 processed_samples 61217 unjoint_samples 60000 processed_samples 61219 unjoint_samples 60000 processed_samples 61257 unjoint_samples 60000 processed_samples 61261 unjoint_samples 60000 processed_samples 61271 unjoint_samples 60000 processed_samples 61286 unjoint_samples 60000 processed_samples 61295 unjoint_samples 60000 Token indices sequence length is longer than the specified maximum sequence length for this model (83611 > 16384). Running this sequence through the model will result in indexing errors Token indices sequence length is longer than the specified maximum sequence length for this model (20727 > 16384). Running this sequence through the model will result in indexing errors processed_samples 71408 unjoint_samples 70000 processed_samples 71425 unjoint_samples 70000 processed_samples 71445 unjoint_samples 70000 processed_samples 71447 unjoint_samples 70000 processed_samples 71475 unjoint_samples 70000 processed_samples 71502 unjoint_samples 70000 processed_samples 71395 unjoint_samples 70000 processed_samples 71546 unjoint_samples 70000 processed_samples 71409 unjoint_samples 70000 processed_samples 71427 unjoint_samples 70000 processed_samples 71597 unjoint_samples 70000 processed_samples 71465 unjoint_samples 70000 processed_samples 71468 unjoint_samples 70000 processed_samples 71479 unjoint_samples 70000 processed_samples 71481 unjoint_samples 70000 processed_samples 71484 unjoint_samples 70000 Token indices sequence length is longer than the specified maximum sequence length for this model (141185 > 16384). Running this sequence through the model will result in indexing errors local_disk/cognitron_vl/cognitron_vl/data/processor/image_processor.py:240: ResourceWarning: unclosed file <_io.BufferedReader name='datasets/LMM/Vision-Flan/vision-flan_191-task_1k/images_191task_1k/Yoga-82+yoga_pose_recognition_979_P1060632.jpg'> image = Image.open(img_or_path).convert("RGB") ResourceWarning: Enable tracemalloc to get the object allocation traceback /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/PIL/TiffImagePlugin.py:870: UserWarning: Corrupt EXIF data. Expecting to read 4 bytes but only got 0. warnings.warn(str(msg)) local_disk/cognitron_vl/cognitron_vl/data/processor/image_processor.py:240: ResourceWarning: unclosed file <_io.BufferedReader name='datasets/LMM/Vision-Flan/vision-flan_191-task_1k/images_191task_1k/WIT+detailed_description_585_Carl_II_of_Sweden%2C_Carl_I_of_Norway.jpg'> image = Image.open(img_or_path).convert("RGB") ResourceWarning: Enable tracemalloc to get the object allocation traceback /root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/PIL/TiffImagePlugin.py:870: UserWarning: Corrupt EXIF data. Expecting to read 12 bytes but only got 10. warnings.warn(str(msg)) Traceback (most recent call last): File "/local_disk/cognitron_vl//lcvlm_modellink/pretrain_lcvlm.py", line 1054, in main() File "/local_disk/cognitron_vl//lcvlm_modellink/pretrain_lcvlm.py", line 1041, in main pretrain(train_valid_test_datasets_provider, File "local_disk/cognitron_vl/third_party/ModelLink/modellink/training/training.py", line 349, in pretrain iteration, num_floating_point_operations_so_far = train(*train_args) File "local_disk/cognitron_vl/third_party/ModelLink/modellink/training/training.py", line 493, in train train_step(forward_step_func, File "local_disk/cognitron_vl/third_party/Megatron-LM_core_r0.6.0/megatron/training/training.py", line 541, in train_step losses_reduced = forward_backward_func( File "local_disk/cognitron_vl/third_party/Megatron-LM_core_r0.6.0/megatron/core/pipeline_parallel/schedules.py", line 356, in forward_backward_no_pipelining output_tensor = forward_step( File "local_disk/cognitron_vl/third_party/Megatron-LM_core_r0.6.0/megatron/core/pipeline_parallel/schedules.py", line 192, in forward_step output_tensor, loss_func = forward_step_func(data_iterator, model) File "/local_disk/cognitron_vl//lcvlm_modellink/pretrain_lcvlm.py", line 863, in forward_step tokens, labels, loss_mask, attention_mask, position_ids, external_dict = get_batch( File "/local_disk/cognitron_vl//lcvlm_modellink/pretrain_lcvlm.py", line 706, in get_batch batch = get_batch_on_this_tp_rank(data_iterator) File "local_disk/cognitron_vl/lcvlm_modellink/training/utils.py", line 710, in get_batch_on_this_tp_rank data = next(data_iterator) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/utils/data/dataloader.py", line 630, in __next__ data = self._next_data() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/utils/data/dataloader.py", line 1318, in _next_data raise StopIteration StopIteration [2024-10-17 19:15:13,239] torch.distributed.elastic.multiprocessing.api: [WARNING] Sending process 1244 closing signal SIGTERM [2024-10-17 19:15:13,239] torch.distributed.elastic.multiprocessing.api: [WARNING] Sending process 1245 closing signal SIGTERM [2024-10-17 19:15:13,239] torch.distributed.elastic.multiprocessing.api: [WARNING] Sending process 1246 closing signal SIGTERM [2024-10-17 19:15:13,239] torch.distributed.elastic.multiprocessing.api: [WARNING] Sending process 1247 closing signal SIGTERM [2024-10-17 19:15:13,239] torch.distributed.elastic.multiprocessing.api: [WARNING] Sending process 1248 closing signal SIGTERM [2024-10-17 19:15:13,239] torch.distributed.elastic.multiprocessing.api: [WARNING] Sending process 1249 closing signal SIGTERM [2024-10-17 19:15:13,239] torch.distributed.elastic.multiprocessing.api: [WARNING] Sending process 1250 closing signal SIGTERM [2024-10-17 19:15:13,240] torch.distributed.elastic.multiprocessing.api: [WARNING] Sending process 1251 closing signal SIGTERM [2024-10-17 19:15:13,240] torch.distributed.elastic.multiprocessing.api: [WARNING] Sending process 1253 closing signal SIGTERM [2024-10-17 19:15:13,240] torch.distributed.elastic.multiprocessing.api: [WARNING] Sending process 1254 closing signal SIGTERM [2024-10-17 19:15:13,240] torch.distributed.elastic.multiprocessing.api: [WARNING] Sending process 1256 closing signal SIGTERM [2024-10-17 19:15:13,240] torch.distributed.elastic.multiprocessing.api: [WARNING] Sending process 1258 closing signal SIGTERM [2024-10-17 19:15:13,240] torch.distributed.elastic.multiprocessing.api: [WARNING] Sending process 1259 closing signal SIGTERM [2024-10-17 19:15:13,240] torch.distributed.elastic.multiprocessing.api: [WARNING] Sending process 1261 closing signal SIGTERM [2024-10-17 19:15:13,240] torch.distributed.elastic.multiprocessing.api: [WARNING] Sending process 1263 closing signal SIGTERM Process ForkServerProcess-5: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-7: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-3: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-8: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-6: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-9: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-2: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-4: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-9: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-5: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-7: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-2: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-8: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-3: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-6: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-4: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-8: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-5: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-7: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-3: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-9: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-6: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-4: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-2: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError [2024-10-17 19:15:14,723] torch.distributed.elastic.multiprocessing.api: [ERROR] failed (exitcode: 1) local_rank: 8 (pid: 1252) of binary: /root/miniconda3/envs/torch21_python38/bin/python Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/bin/torchrun", line 8, in sys.exit(main()) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/elastic/multiprocessing/errors/__init__.py", line 346, in wrapper return f(*args, **kwargs) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/run.py", line 806, in main run(args) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/run.py", line 797, in run elastic_launch( File "/root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/launcher/api.py", line 134, in __call__ return launch_agent(self._config, self._entrypoint, list(args)) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/site-packages/torch/distributed/launcher/api.py", line 264, in launch_agent raise ChildFailedError( torch.distributed.elastic.multiprocessing.errors.ChildFailedError: ============================================================ /local_disk/cognitron_vl//lcvlm_modellink/pretrain_lcvlm.py FAILED ------------------------------------------------------------ Failures: ------------------------------------------------------------ Root Cause (first observed failure): [0]: time : 2024-10-17_19:15:13 host : train-1165841964676693248-8uvcht9qqrr4-worker-8 rank : 152 (local_rank: 8) exitcode : 1 (pid: 1252) error_file: traceback : To enable traceback see: https://pytorch.org/docs/stable/elastic/errors.html ============================================================ Process ForkServerProcess-2: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-8: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-7: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-3: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-5: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-9: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-4: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-6: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-5: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-3: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-4: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-9: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-7: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-6: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-8: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-2: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-4: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-3: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-5: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-9: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-8: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-6: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-7: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-2: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-9: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-4: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-8: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-5: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-6: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-2: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-7: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-3: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-4: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-2: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-9: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-6: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-7: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-8: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-3: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-5: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-6: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-2: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-9: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-5: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-8: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-4: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-7: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-3: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-9: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-3: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-8: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-5: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-2: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-4: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-6: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-7: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-3: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-7: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-4: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-8: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-5: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-2: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-9: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-6: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-5: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-2: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-4: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-7: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-8: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-3: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-9: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-6: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-4: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-6: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-3: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-2: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-7: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-8: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-9: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-5: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-2: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-5: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-7: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-9: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-8: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-3: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-4: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-6: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-9: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-6: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-8: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-2: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-4: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-5: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-7: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError Process ForkServerProcess-3: Traceback (most recent call last): File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 313, in _bootstrap self.run() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/process.py", line 108, in run self._target(*self._args, **self._kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 65, in wrapper raise exp File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 62, in wrapper func(*args, **kwargs) File "/usr/local/Ascend/ascend-toolkit/latest/python/site-packages/tbe/common/repository_manager/route.py", line 262, in task_distribute key, func_name, detail = resource_proxy[TASK_QUEUE].get() File "", line 2, in get File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/managers.py", line 835, in _callmethod kind, result = conn.recv() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 250, in recv buf = self._recv_bytes() File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 414, in _recv_bytes buf = self._recv(4) File "/root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/connection.py", line 383, in _recv raise EOFError EOFError /root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/resource_tracker.py:203: UserWarning: resource_tracker: There appear to be 30 leaked semaphore objects to clean up at shutdown warnings.warn('resource_tracker: There appear to be %d ' /root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/resource_tracker.py:203: UserWarning: resource_tracker: There appear to be 30 leaked semaphore objects to clean up at shutdown warnings.warn('resource_tracker: There appear to be %d ' /root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/resource_tracker.py:203: UserWarning: resource_tracker: There appear to be 30 leaked semaphore objects to clean up at shutdown warnings.warn('resource_tracker: There appear to be %d ' /root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/resource_tracker.py:203: UserWarning: resource_tracker: There appear to be 30 leaked semaphore objects to clean up at shutdown warnings.warn('resource_tracker: There appear to be %d ' /root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/resource_tracker.py:203: UserWarning: resource_tracker: There appear to be 30 leaked semaphore objects to clean up at shutdown warnings.warn('resource_tracker: There appear to be %d ' /root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/resource_tracker.py:203: UserWarning: resource_tracker: There appear to be 30 leaked semaphore objects to clean up at shutdown warnings.warn('resource_tracker: There appear to be %d ' /root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/resource_tracker.py:203: UserWarning: resource_tracker: There appear to be 30 leaked semaphore objects to clean up at shutdown warnings.warn('resource_tracker: There appear to be %d ' /root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/resource_tracker.py:203: UserWarning: resource_tracker: There appear to be 30 leaked semaphore objects to clean up at shutdown warnings.warn('resource_tracker: There appear to be %d ' /root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/resource_tracker.py:203: UserWarning: resource_tracker: There appear to be 30 leaked semaphore objects to clean up at shutdown warnings.warn('resource_tracker: There appear to be %d ' /root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/resource_tracker.py:203: UserWarning: resource_tracker: There appear to be 30 leaked semaphore objects to clean up at shutdown warnings.warn('resource_tracker: There appear to be %d ' /root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/resource_tracker.py:203: UserWarning: resource_tracker: There appear to be 30 leaked semaphore objects to clean up at shutdown warnings.warn('resource_tracker: There appear to be %d ' /root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/resource_tracker.py:203: UserWarning: resource_tracker: There appear to be 30 leaked semaphore objects to clean up at shutdown warnings.warn('resource_tracker: There appear to be %d ' /root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/resource_tracker.py:203: UserWarning: resource_tracker: There appear to be 30 leaked semaphore objects to clean up at shutdown warnings.warn('resource_tracker: There appear to be %d ' /root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/resource_tracker.py:203: UserWarning: resource_tracker: There appear to be 30 leaked semaphore objects to clean up at shutdown warnings.warn('resource_tracker: There appear to be %d ' /root/miniconda3/envs/torch21_python38/lib/python3.8/multiprocessing/resource_tracker.py:203: UserWarning: resource_tracker: There appear to be 30 leaked semaphore objects to clean up at shutdown warnings.warn('resource_tracker: There appear to be %d '