htlou committed on
Commit
6e45475
1 Parent(s): 41d93a3
.gitignore ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ wandb/
2
+ script.sh
arguments.yaml ADDED
@@ -0,0 +1,49 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ data_cfgs:
2
+ eval_data_files: null
3
+ eval_datasets: null
4
+ eval_optional_args: []
5
+ eval_size: null
6
+ eval_split: null
7
+ eval_subset: null
8
+ eval_template: null
9
+ train_data_files: 8713_tokenized_v2.pt
10
+ train_datasets: /aifs4su/yaodong/datasets/llava_annotated
11
+ train_optional_args: []
12
+ train_size: null
13
+ train_split: train
14
+ train_subset: null
15
+ train_template: ANYTHING_TI2TI
16
+ logger_cfgs:
17
+ cache_dir: null
18
+ log_project: align-anything
19
+ log_run_name: sft
20
+ log_type: wandb
21
+ output_dir: ../outputs/sft_chameleon_0727_0802_v2.1_1e-4
22
+ save_interval: 500.0
23
+ model_cfgs:
24
+ model_max_length: 4096
25
+ model_name_or_path: /aifs4su/yaodong/projects/hantao/anole/facilitating_image_generation/model/chameleon_hf_0727
26
+ trust_remote_code: true
27
+ special_tokens: null
28
+ train_cfgs:
29
+ adam_betas:
30
+ - 0.9
31
+ - 0.95
32
+ adam_epsilon: 1.0e-08
33
+ bf16: true
34
+ ds_cfgs: ds_z3_config.json
35
+ epochs: 3
36
+ eval_interval: 1000
37
+ eval_strategy: steps
38
+ fp16: false
39
+ freeze_language_model: false
40
+ gradient_accumulation_steps: 2.0
41
+ gradient_checkpointing: true
42
+ learning_rate: 0.0001
43
+ lr_scheduler_type: cosine
44
+ lr_warmup_ratio: 0.03
45
+ max_grad_norm: 1.0
46
+ per_device_eval_batch_size: 2.0
47
+ per_device_train_batch_size: 2.0
48
+ seed: 42
49
+ weight_decay: 0.0
config.json ADDED
The diff for this file is too large to render. See raw diff
 
environ.txt ADDED
@@ -0,0 +1,166 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ BASH_FUNC__module_raw%%=() { unset _mlshdbg;
2
+ if [ "${MODULES_SILENT_SHELL_DEBUG:-0}" = '1' ]; then
3
+ case "$-" in
4
+ *v*x*)
5
+ set +vx;
6
+ _mlshdbg='vx'
7
+ ;;
8
+ *v*)
9
+ set +v;
10
+ _mlshdbg='v'
11
+ ;;
12
+ *x*)
13
+ set +x;
14
+ _mlshdbg='x'
15
+ ;;
16
+ *)
17
+ _mlshdbg=''
18
+ ;;
19
+ esac;
20
+ fi;
21
+ unset _mlre _mlIFS;
22
+ if [ -n "${IFS+x}" ]; then
23
+ _mlIFS=$IFS;
24
+ fi;
25
+ IFS=' ';
26
+ for _mlv in ${MODULES_RUN_QUARANTINE:-};
27
+ do
28
+ if [ "${_mlv}" = "${_mlv##*[!A-Za-z0-9_]}" -a "${_mlv}" = "${_mlv#[0-9]}" ]; then
29
+ if [ -n "`eval 'echo ${'$_mlv'+x}'`" ]; then
30
+ _mlre="${_mlre:-}${_mlv}_modquar='`eval 'echo ${'$_mlv'}'`' ";
31
+ fi;
32
+ _mlrv="MODULES_RUNENV_${_mlv}";
33
+ _mlre="${_mlre:-}${_mlv}='`eval 'echo ${'$_mlrv':-}'`' ";
34
+ fi;
35
+ done;
36
+ if [ -n "${_mlre:-}" ]; then
37
+ eval `eval ${_mlre} /usr/bin/tclsh /cm/local/apps/environment-modules/4.5.3/libexec/modulecmd.tcl bash '"$@"'`;
38
+ else
39
+ eval `/usr/bin/tclsh /cm/local/apps/environment-modules/4.5.3/libexec/modulecmd.tcl bash "$@"`;
40
+ fi;
41
+ _mlstatus=$?;
42
+ if [ -n "${_mlIFS+x}" ]; then
43
+ IFS=$_mlIFS;
44
+ else
45
+ unset IFS;
46
+ fi;
47
+ unset _mlre _mlv _mlrv _mlIFS;
48
+ if [ -n "${_mlshdbg:-}" ]; then
49
+ set -$_mlshdbg;
50
+ fi;
51
+ unset _mlshdbg;
52
+ return $_mlstatus
53
+ }
54
+ BASH_FUNC_ml%%=() { module ml "$@"
55
+ }
56
+ BASH_FUNC_module%%=() { _module_raw "$@" 2>&1
57
+ }
58
+ BASH_FUNC_switchml%%=() { typeset swfound=1;
59
+ if [ "${MODULES_USE_COMPAT_VERSION:-0}" = '1' ]; then
60
+ typeset swname='main';
61
+ if [ -e /cm/local/apps/environment-modules/4.5.3/libexec/modulecmd.tcl ]; then
62
+ typeset swfound=0;
63
+ unset MODULES_USE_COMPAT_VERSION;
64
+ fi;
65
+ else
66
+ typeset swname='compatibility';
67
+ if [ -e /cm/local/apps/environment-modules/4.5.3/libexec/modulecmd-compat ]; then
68
+ typeset swfound=0;
69
+ MODULES_USE_COMPAT_VERSION=1;
70
+ export MODULES_USE_COMPAT_VERSION;
71
+ fi;
72
+ fi;
73
+ if [ $swfound -eq 0 ]; then
74
+ echo "Switching to Modules $swname version";
75
+ source /cm/local/apps/environment-modules/4.5.3/init/bash;
76
+ else
77
+ echo "Cannot switch to Modules $swname version, command not found";
78
+ return 1;
79
+ fi
80
+ }
81
+ CMD_WLM_CLUSTER_NAME=slurm
82
+ CONDA_DEFAULT_ENV=hantao_new
83
+ CONDA_EXE=/aifs4su/yaodong/miniconda3/bin/conda
84
+ CONDA_MKL_INTERFACE_LAYER_BACKUP=
85
+ CONDA_PREFIX=/aifs4su/yaodong/miniconda3/envs/hantao_new
86
+ CONDA_PREFIX_1=/aifs4su/yaodong/miniconda3
87
+ CONDA_PROMPT_MODIFIER=(hantao_new)
88
+ CONDA_PYTHON_EXE=/aifs4su/yaodong/miniconda3/bin/python
89
+ CONDA_SHLVL=2
90
+ CPATH=/cm/shared/apps/slurm/current/include
91
+ CPATH_modshare=/cm/shared/apps/slurm/current/include:1
92
+ CROSS_RANK=0
93
+ CROSS_SIZE=1
94
+ CUDA_HOME=/aifs4su/yaodong/miniconda3/envs/hantao_new
95
+ CUDA_MODULE_LOADING=LAZY
96
+ CUDA_VISIBLE_DEVICES=0,1,2,3,4,5,6,7
97
+ DBUS_SESSION_BUS_ADDRESS=unix:path=/run/user/1028/bus
98
+ ENABLE_LMOD=0
99
+ GSETTINGS_SCHEMA_DIR=/aifs4su/yaodong/miniconda3/envs/hantao_new/share/glib-2.0/schemas
100
+ GSETTINGS_SCHEMA_DIR_CONDA_BACKUP=
101
+ HOME=/home/yangyaodong
102
+ LANG=C.UTF-8
103
+ LD_LIBRARY_PATH=/usr/mpi/gcc/openmpi-4.1.7a1/lib:/usr/local/cuda/lib64:/usr/local/cuda/lib64:/cm/shared/apps/slurm/current/lib64/slurm:/cm/shared/apps/slurm/current/lib64
104
+ LD_LIBRARY_PATH_modshare=/cm/shared/apps/slurm/current/lib64:1:/usr/mpi/gcc/openmpi-4.1.7a1/lib:1:/cm/shared/apps/slurm/current/lib64/slurm:1:/usr/local/cuda/lib64:1
105
+ LD_RUN_PATH=/usr/mpi/gcc/openmpi-4.1.7a1/lib
106
+ LD_RUN_PATH_modshare=/usr/mpi/gcc/openmpi-4.1.7a1/lib:1
107
+ LESSCLOSE=/usr/bin/lesspipe %s %s
108
+ LESSOPEN=| /usr/bin/lesspipe %s
109
+ LIBRARY_PATH=/cm/shared/apps/slurm/current/lib64/slurm:/cm/shared/apps/slurm/current/lib64
110
+ LIBRARY_PATH_modshare=/cm/shared/apps/slurm/current/lib64:1:/cm/shared/apps/slurm/current/lib64/slurm:1
111
+ LOADEDMODULES=slurm/slurm/23.02.6:gcc/64/4.1.7a1
112
+ LOADEDMODULES_modshare=slurm/slurm/23.02.6:1:gcc/64/4.1.7a1:1
113
+ LOCAL_RANK=0
114
+ LOCAL_SIZE=8
115
+ LOGLEVEL=WARNING
116
+ LOGNAME=yangyaodong
117
+ LS_COLORS=rs=0:di=01;34:ln=01;36:mh=00:pi=40;33:so=01;35:do=01;35:bd=40;33;01:cd=40;33;01:or=40;31;01:mi=00:su=37;41:sg=30;43:ca=30;41:tw=30;42:ow=34;42:st=37;44:ex=01;32:*.tar=01;31:*.tgz=01;31:*.arc=01;31:*.arj=01;31:*.taz=01;31:*.lha=01;31:*.lz4=01;31:*.lzh=01;31:*.lzma=01;31:*.tlz=01;31:*.txz=01;31:*.tzo=01;31:*.t7z=01;31:*.zip=01;31:*.z=01;31:*.dz=01;31:*.gz=01;31:*.lrz=01;31:*.lz=01;31:*.lzo=01;31:*.xz=01;31:*.zst=01;31:*.tzst=01;31:*.bz2=01;31:*.bz=01;31:*.tbz=01;31:*.tbz2=01;31:*.tz=01;31:*.deb=01;31:*.rpm=01;31:*.jar=01;31:*.war=01;31:*.ear=01;31:*.sar=01;31:*.rar=01;31:*.alz=01;31:*.ace=01;31:*.zoo=01;31:*.cpio=01;31:*.7z=01;31:*.rz=01;31:*.cab=01;31:*.wim=01;31:*.swm=01;31:*.dwm=01;31:*.esd=01;31:*.jpg=01;35:*.jpeg=01;35:*.mjpg=01;35:*.mjpeg=01;35:*.gif=01;35:*.bmp=01;35:*.pbm=01;35:*.pgm=01;35:*.ppm=01;35:*.tga=01;35:*.xbm=01;35:*.xpm=01;35:*.tif=01;35:*.tiff=01;35:*.png=01;35:*.svg=01;35:*.svgz=01;35:*.mng=01;35:*.pcx=01;35:*.mov=01;35:*.mpg=01;35:*.mpeg=01;35:*.m2v=01;35:*.mkv=01;35:*.webm=01;35:*.webp=01;35:*.ogm=01;35:*.mp4=01;35:*.m4v=01;35:*.mp4v=01;35:*.vob=01;35:*.qt=01;35:*.nuv=01;35:*.wmv=01;35:*.asf=01;35:*.rm=01;35:*.rmvb=01;35:*.flc=01;35:*.avi=01;35:*.fli=01;35:*.flv=01;35:*.gl=01;35:*.dl=01;35:*.xcf=01;35:*.xwd=01;35:*.yuv=01;35:*.cgm=01;35:*.emf=01;35:*.ogv=01;35:*.ogx=01;35:*.aac=00;36:*.au=00;36:*.flac=00;36:*.m4a=00;36:*.mid=00;36:*.midi=00;36:*.mka=00;36:*.mp3=00;36:*.mpc=00;36:*.ogg=00;36:*.ra=00;36:*.wav=00;36:*.oga=00;36:*.opus=00;36:*.spx=00;36:*.xspf=00;36:
118
+ MANPATH=/usr/mpi/gcc/openmpi-4.1.7a1/share/man:/cm/shared/apps/slurm/current/man:/cm/local/apps/environment-modules/4.5.3/share/man:/usr/local/man:/usr/local/share/man:/usr/share/man:/cm/local/apps/environment-modules/current/share/man:/cm/local/apps/environment-modules/current/share/man
119
+ MANPATH_modshare=/usr/local/share/man:1:/usr/mpi/gcc/openmpi-4.1.7a1/share/man:1:/cm/local/apps/environment-modules/current/share/man:1:/cm/local/apps/environment-modules/4.5.3/share/man:1:/usr/local/man:1:/usr/share/man:1:/cm/shared/apps/slurm/current/man:1
120
+ MASTER_ADDR=127.0.0.1
121
+ MASTER_PORT=50216
122
+ MIG_PARTED_CHECKPOINT_FILE=/var/lib/nvidia-mig-manager/checkpoint.json
123
+ MIG_PARTED_CONFIG_FILE=/etc/nvidia-mig-manager/config.yaml
124
+ MIG_PARTED_HOOKS_FILE=/etc/nvidia-mig-manager/hooks.yaml
125
+ MKL_INTERFACE_LAYER=LP64,GNU
126
+ MODULEPATH=/cm/local/modulefiles:/cm/shared/modulefiles
127
+ MODULESHOME=/cm/local/apps/environment-modules/4.5.3
128
+ MODULES_CMD=/cm/local/apps/environment-modules/4.5.3/libexec/modulecmd.tcl
129
+ MODULES_SET_SHELL_STARTUP=0
130
+ MOTD_SHOWN=pam
131
+ MPI_HOME=/usr/mpi/gcc/openmpi-4.1.7a1
132
+ MPI_RUN=/usr/mpi/gcc/openmpi-4.1.7a1/bin/mpirun
133
+ OLDPWD=/aifs4su/yaodong/projects/hantao/dev_cham/align-anything/projects/chameleon
134
+ PATH=/aifs4su/yaodong/google-cloud-sdk/bin:/aifs4su/yaodong/miniconda3/envs/hantao_new/bin:/aifs4su/yaodong/miniconda3/condabin:/usr/mpi/gcc/openmpi-4.1.7a1/bin:/usr/local/cuda/bin:/usr/lpp/mmfs/bin:/usr/local/cuda/bin:/opt/bin:/usr/local/cuda/bin:/usr/lpp/mmfs/bin:/cm/shared/apps/slurm/current/sbin:/cm/shared/apps/slurm/current/bin:/usr/local/cuda/bin:/opt/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/usr/local/games:/snap/bin:/sbin:/usr/sbin:/cm/local/apps/environment-modules/4.5.3/bin
135
+ PATH_modshare=/usr/mpi/gcc/openmpi-4.1.7a1/bin:1:/opt/bin/:1:/usr/bin:1:/usr/local/bin:1:/cm/shared/apps/slurm/current/bin:1:/cm/shared/apps/slurm/current/sbin:1:/bin:1:/snap/bin:1:/sbin:1:/usr/sbin:1:/cm/local/apps/environment-modules/4.5.3/bin:1:/usr/games:1:/usr/local/sbin:1:/usr/lpp/mmfs/bin:1:/usr/local/cuda/bin:1:/usr/local/games:1
136
+ PWD=/aifs4su/yaodong/projects/hantao/dev_cham/align-anything/scripts
137
+ PYTHONHASHSEED=42
138
+ PYTHONPATH=/aifs4su/yaodong/projects/hantao/dev_cham/align-anything
139
+ RANK=0
140
+ SHELL=/bin/bash
141
+ SHLVL=3
142
+ SLURM_CONF=/cm/shared/apps/slurm/var/etc/slurm/slurm.conf
143
+ SSH_CLIENT=10.33.5.36 36286 22
144
+ SSH_CONNECTION=10.33.5.36 36286 10.33.4.214 22
145
+ SSH_TTY=/dev/pts/1
146
+ TERM=screen
147
+ TERM_PROGRAM=tmux
148
+ TERM_PROGRAM_VERSION=3.2a
149
+ TMUX=/tmp/tmux-1028/default,3233837,0
150
+ TMUX_PANE=%0
151
+ TRITON_CACHE_DIR=/aifs4su/yaodong/cache/triton
152
+ USER=yangyaodong
153
+ WANDB_API_KEY=547f38af44135ca76a4f4eed9c8d135532da4960
154
+ WANDB_SERVICE=2-361042-tcp-localhost-58047
155
+ WORLD_SIZE=8
156
+ XDG_DATA_DIRS=/usr/local/share:/usr/share:/var/lib/snapd/desktop
157
+ XDG_RUNTIME_DIR=/run/user/1028
158
+ XDG_SESSION_CLASS=user
159
+ XDG_SESSION_ID=626
160
+ XDG_SESSION_TYPE=tty
161
+ XML_CATALOG_FILES=file:///aifs4su/yaodong/miniconda3/envs/hantao_new/etc/xml/catalog file:///etc/xml/catalog
162
+ _=/aifs4su/yaodong/miniconda3/envs/hantao_new/bin/deepspeed
163
+ _CE_CONDA=
164
+ _CE_M=
165
+ _LMFILES_=/cm/local/modulefiles/slurm/slurm/23.02.6:/cm/local/modulefiles/gcc/64/4.1.7a1
166
+ _LMFILES__modshare=/cm/local/modulefiles/slurm/slurm/23.02.6:1:/cm/local/modulefiles/gcc/64/4.1.7a1:1
preprocessor_config.json ADDED
@@ -0,0 +1,28 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "crop_size": {
3
+ "height": 512,
4
+ "width": 512
5
+ },
6
+ "do_center_crop": true,
7
+ "do_convert_rgb": true,
8
+ "do_normalize": true,
9
+ "do_rescale": true,
10
+ "do_resize": true,
11
+ "image_mean": [
12
+ 1.0,
13
+ 1.0,
14
+ 1.0
15
+ ],
16
+ "image_processor_type": "ChameleonImageProcessor",
17
+ "image_std": [
18
+ 1.0,
19
+ 1.0,
20
+ 1.0
21
+ ],
22
+ "processor_class": "ChameleonProcessor",
23
+ "resample": 1,
24
+ "rescale_factor": 0.0078,
25
+ "size": {
26
+ "shortest_edge": 512
27
+ }
28
+ }
processor_config.json ADDED
@@ -0,0 +1,5 @@
 
 
 
 
 
 
1
+ {
2
+ "image_seq_length": 1024,
3
+ "image_token": "<image>",
4
+ "processor_class": "ChameleonProcessor"
5
+ }
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:281fb5305fc5d9528c8647f87e2ee4e918af417f338610052d09b3da0cc333fe
3
+ size 14165009930
special_tokens_map.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "content": "<s>",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "eos_token": {
10
+ "content": "</s>",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "pad_token": {
17
+ "content": "<pad>",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ },
23
+ "sep_token": {
24
+ "content": "<reserved08706>",
25
+ "lstrip": false,
26
+ "normalized": false,
27
+ "rstrip": false,
28
+ "single_word": false
29
+ },
30
+ "unk_token": {
31
+ "content": "<unk>",
32
+ "lstrip": false,
33
+ "normalized": false,
34
+ "rstrip": false,
35
+ "single_word": false
36
+ }
37
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
The diff for this file is too large to render. See raw diff