Gaie committed on
Commit
f7308d8
1 Parent(s): de8fcce

Add files using upload-large-folder tool

Browse files
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ wandb/run-20241023_195332-5p9x2ymn/run-5p9x2ymn.wandb filter=lfs diff=lfs merge=lfs -text
added_tokens.json ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ {
2
+ "<image>": 32000,
3
+ "<pad>": 32001
4
+ }
arguments.yaml ADDED
@@ -0,0 +1,52 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ data_cfgs:
2
+ eval_data_files: null
3
+ eval_datasets: /home/align-anything/datasets/40k_ti2t_filtered
4
+ eval_name: null
5
+ eval_optional_args: []
6
+ eval_size: null
7
+ eval_split: train
8
+ eval_subset: null
9
+ eval_template: AA_TI2T
10
+ train_data_files: null
11
+ train_datasets: /data/align-anything/jiayi/ti2t/refine_gen_wo_res/1021_13b_2000
12
+ train_name: null
13
+ train_optional_args: []
14
+ train_size: null
15
+ train_split: train
16
+ train_subset: null
17
+ train_template: AA_TI2T_Critique
18
+ logger_cfgs:
19
+ cache_dir: null
20
+ log_project: align-anything
21
+ log_run_name: rm
22
+ log_type: wandb
23
+ output_dir: /data/align-anything/jiayi/ti2t/rm_10_22_ours_13b_2000
24
+ save_interval: 598.0
25
+ model_cfgs:
26
+ model_max_length: 2048
27
+ model_name_or_path: /data/models/llava/llava-1.5-13b-hf
28
+ trust_remote_code: true
29
+ special_tokens: null
30
+ train_cfgs:
31
+ adam_betas:
32
+ - 0.9
33
+ - 0.95
34
+ bf16: true
35
+ ds_cfgs: ds_z3_config.json
36
+ epochs: 5.0
37
+ eval_interval: 10
38
+ eval_strategy: epoch
39
+ fp16: false
40
+ freeze_language_model: false
41
+ freeze_mm_proj: false
42
+ freeze_vision_tower: true
43
+ gradient_accumulation_steps: 1
44
+ gradient_checkpointing: true
45
+ learning_rate: 3.0e-05
46
+ lr_scheduler_type: constant_with_warmup
47
+ lr_warmup_ratio: 0.03
48
+ per_device_eval_batch_size: 4
49
+ per_device_train_batch_size: 4
50
+ regularization: 0.001
51
+ seed: 42
52
+ weight_decay: 0.0
chat_template.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ {
2
+ "chat_template": "{% for message in messages %}{% if message['role'] != 'system' %}{{ message['role'].upper() + ': '}}{% endif %}{# Render all images first #}{% for content in message['content'] | selectattr('type', 'equalto', 'image') %}{{ '<image>\n' }}{% endfor %}{# Render all text next #}{% if message['role'] != 'assistant' %}{% for content in message['content'] | selectattr('type', 'equalto', 'text') %}{{ content['text'] + ' '}}{% endfor %}{% else %}{% for content in message['content'] | selectattr('type', 'equalto', 'text') %}{% generation %}{{ content['text'] + ' '}}{% endgeneration %}{% endfor %}{% endif %}{% endfor %}{% if add_generation_prompt %}{{ 'ASSISTANT:' }}{% endif %}"
3
+ }
config.json ADDED
@@ -0,0 +1,180 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "/data/models/llava/llava-1.5-13b-hf",
3
+ "architectures": [
4
+ "LlavaForConditionalGeneration"
5
+ ],
6
+ "bos_token_id": 1,
7
+ "eos_token_id": 2,
8
+ "ignore_index": -100,
9
+ "image_seq_length": 576,
10
+ "image_token_index": 32000,
11
+ "model_type": "llava",
12
+ "pad_token_id": 32001,
13
+ "projector_hidden_act": "gelu",
14
+ "text_config": {
15
+ "_name_or_path": "meta-llama/Llama-2-13b-hf",
16
+ "add_cross_attention": false,
17
+ "architectures": [
18
+ "LlamaForCausalLM"
19
+ ],
20
+ "attention_bias": false,
21
+ "attention_dropout": 0.0,
22
+ "bad_words_ids": null,
23
+ "begin_suppress_tokens": null,
24
+ "bos_token_id": 1,
25
+ "chunk_size_feed_forward": 0,
26
+ "cross_attention_hidden_size": null,
27
+ "decoder_start_token_id": null,
28
+ "diversity_penalty": 0.0,
29
+ "do_sample": false,
30
+ "early_stopping": false,
31
+ "encoder_no_repeat_ngram_size": 0,
32
+ "eos_token_id": 2,
33
+ "exponential_decay_length_penalty": null,
34
+ "finetuning_task": null,
35
+ "forced_bos_token_id": null,
36
+ "forced_eos_token_id": null,
37
+ "head_dim": 128,
38
+ "hidden_act": "silu",
39
+ "hidden_size": 5120,
40
+ "id2label": {
41
+ "0": "LABEL_0",
42
+ "1": "LABEL_1"
43
+ },
44
+ "initializer_range": 0.02,
45
+ "intermediate_size": 13824,
46
+ "is_decoder": false,
47
+ "is_encoder_decoder": false,
48
+ "label2id": {
49
+ "LABEL_0": 0,
50
+ "LABEL_1": 1
51
+ },
52
+ "length_penalty": 1.0,
53
+ "max_length": 20,
54
+ "max_position_embeddings": 4096,
55
+ "min_length": 0,
56
+ "mlp_bias": false,
57
+ "model_type": "llama",
58
+ "no_repeat_ngram_size": 0,
59
+ "num_attention_heads": 40,
60
+ "num_beam_groups": 1,
61
+ "num_beams": 1,
62
+ "num_hidden_layers": 40,
63
+ "num_key_value_heads": 40,
64
+ "num_return_sequences": 1,
65
+ "output_attentions": false,
66
+ "output_hidden_states": false,
67
+ "output_scores": false,
68
+ "pad_token_id": null,
69
+ "prefix": null,
70
+ "pretraining_tp": 1,
71
+ "problem_type": null,
72
+ "pruned_heads": {},
73
+ "remove_invalid_values": false,
74
+ "repetition_penalty": 1.0,
75
+ "return_dict": true,
76
+ "return_dict_in_generate": false,
77
+ "rms_norm_eps": 1e-05,
78
+ "rope_scaling": null,
79
+ "rope_theta": 10000.0,
80
+ "sep_token_id": null,
81
+ "suppress_tokens": null,
82
+ "task_specific_params": null,
83
+ "temperature": 1.0,
84
+ "tf_legacy_loss": false,
85
+ "tie_encoder_decoder": false,
86
+ "tie_word_embeddings": false,
87
+ "tokenizer_class": null,
88
+ "top_k": 50,
89
+ "top_p": 1.0,
90
+ "torch_dtype": "float16",
91
+ "torchscript": false,
92
+ "typical_p": 1.0,
93
+ "use_bfloat16": false,
94
+ "use_cache": true,
95
+ "vocab_size": 32064
96
+ },
97
+ "tie_word_embeddings": false,
98
+ "torch_dtype": "float16",
99
+ "transformers_version": "4.46.0.dev0",
100
+ "vision_config": {
101
+ "_name_or_path": "",
102
+ "add_cross_attention": false,
103
+ "architectures": null,
104
+ "attention_dropout": 0.0,
105
+ "bad_words_ids": null,
106
+ "begin_suppress_tokens": null,
107
+ "bos_token_id": null,
108
+ "chunk_size_feed_forward": 0,
109
+ "cross_attention_hidden_size": null,
110
+ "decoder_start_token_id": null,
111
+ "diversity_penalty": 0.0,
112
+ "do_sample": false,
113
+ "early_stopping": false,
114
+ "encoder_no_repeat_ngram_size": 0,
115
+ "eos_token_id": null,
116
+ "exponential_decay_length_penalty": null,
117
+ "finetuning_task": null,
118
+ "forced_bos_token_id": null,
119
+ "forced_eos_token_id": null,
120
+ "hidden_act": "quick_gelu",
121
+ "hidden_size": 1024,
122
+ "id2label": {
123
+ "0": "LABEL_0",
124
+ "1": "LABEL_1"
125
+ },
126
+ "image_size": 336,
127
+ "initializer_factor": 1.0,
128
+ "initializer_range": 0.02,
129
+ "intermediate_size": 4096,
130
+ "is_decoder": false,
131
+ "is_encoder_decoder": false,
132
+ "label2id": {
133
+ "LABEL_0": 0,
134
+ "LABEL_1": 1
135
+ },
136
+ "layer_norm_eps": 1e-05,
137
+ "length_penalty": 1.0,
138
+ "max_length": 20,
139
+ "min_length": 0,
140
+ "model_type": "clip_vision_model",
141
+ "no_repeat_ngram_size": 0,
142
+ "num_attention_heads": 16,
143
+ "num_beam_groups": 1,
144
+ "num_beams": 1,
145
+ "num_channels": 3,
146
+ "num_hidden_layers": 24,
147
+ "num_return_sequences": 1,
148
+ "output_attentions": false,
149
+ "output_hidden_states": false,
150
+ "output_scores": false,
151
+ "pad_token_id": null,
152
+ "patch_size": 14,
153
+ "prefix": null,
154
+ "problem_type": null,
155
+ "projection_dim": 768,
156
+ "pruned_heads": {},
157
+ "remove_invalid_values": false,
158
+ "repetition_penalty": 1.0,
159
+ "return_dict": true,
160
+ "return_dict_in_generate": false,
161
+ "sep_token_id": null,
162
+ "suppress_tokens": null,
163
+ "task_specific_params": null,
164
+ "temperature": 1.0,
165
+ "tf_legacy_loss": false,
166
+ "tie_encoder_decoder": false,
167
+ "tie_word_embeddings": true,
168
+ "tokenizer_class": null,
169
+ "top_k": 50,
170
+ "top_p": 1.0,
171
+ "torch_dtype": null,
172
+ "torchscript": false,
173
+ "typical_p": 1.0,
174
+ "use_bfloat16": false,
175
+ "vocab_size": 32000
176
+ },
177
+ "vision_feature_layer": -2,
178
+ "vision_feature_select_strategy": "default",
179
+ "vocab_size": 32064
180
+ }
environ.txt ADDED
@@ -0,0 +1,156 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ADDR2LINE=/home/align-anything/miniconda3/envs/jy-align/bin/x86_64-conda-linux-gnu-addr2line
2
+ AR=/home/align-anything/miniconda3/envs/jy-align/bin/x86_64-conda-linux-gnu-ar
3
+ AS=/home/align-anything/miniconda3/envs/jy-align/bin/x86_64-conda-linux-gnu-as
4
+ BROWSER=/home/align-anything/.cursor-server/cli/servers/Stable-51c8aff7cb5a89f4a0e462fbacab938bdbfaf140/server/bin/helpers/browser.sh
5
+ BUILD=x86_64-conda-linux-gnu
6
+ CC=/home/align-anything/miniconda3/envs/jy-align/bin/x86_64-conda-linux-gnu-cc
7
+ CC_FOR_BUILD=/home/align-anything/miniconda3/envs/jy-align/bin/x86_64-conda-linux-gnu-cc
8
+ CFLAGS=-march=nocona -mtune=haswell -ftree-vectorize -fPIC -fstack-protector-strong -fno-plt -O2 -ffunction-sections -pipe -isystem /home/align-anything/miniconda3/envs/jy-align/include -march=nocona -mtune=haswell -ftree-vectorize -fPIC -fstack-protector-strong -fno-plt -O2 -ffunction-sections -pipe -isystem /data/align-anything/miniconda3/envs/jy-a/include -march=nocona -mtune=haswell -ftree-vectorize -fPIC -fstack-protector-strong -fno-plt -O2 -ffunction-sections -pipe -isystem /data/align-anything/miniconda3/envs/jy-a/include -I/data/align-anything/miniconda3/envs/jy-a/targets/x86_64-linux/include -L/data/align-anything/miniconda3/envs/jy-a/targets/x86_64-linux/lib -L/data/align-anything/miniconda3/envs/jy-a/targets/x86_64-linux/lib/stubs -I/home/align-anything/miniconda3/envs/jy-align/targets/x86_64-linux/include -L/home/align-anything/miniconda3/envs/jy-align/targets/x86_64-linux/lib -L/home/align-anything/miniconda3/envs/jy-align/targets/x86_64-linux/lib/stubs
9
+ CMAKE_ARGS=-DCMAKE_AR=/home/align-anything/miniconda3/envs/jy-align/bin/x86_64-conda-linux-gnu-ar -DCMAKE_CXX_COMPILER_AR=/home/align-anything/miniconda3/envs/jy-align/bin/x86_64-conda-linux-gnu-gcc-ar -DCMAKE_C_COMPILER_AR=/home/align-anything/miniconda3/envs/jy-align/bin/x86_64-conda-linux-gnu-gcc-ar -DCMAKE_RANLIB=/home/align-anything/miniconda3/envs/jy-align/bin/x86_64-conda-linux-gnu-ranlib -DCMAKE_CXX_COMPILER_RANLIB=/home/align-anything/miniconda3/envs/jy-align/bin/x86_64-conda-linux-gnu-gcc-ranlib -DCMAKE_C_COMPILER_RANLIB=/home/align-anything/miniconda3/envs/jy-align/bin/x86_64-conda-linux-gnu-gcc-ranlib -DCMAKE_LINKER=/home/align-anything/miniconda3/envs/jy-align/bin/x86_64-conda-linux-gnu-ld -DCMAKE_STRIP=/home/align-anything/miniconda3/envs/jy-align/bin/x86_64-conda-linux-gnu-strip -DCMAKE_BUILD_TYPE=Release
10
+ CMAKE_PREFIX_PATH=/home/align-anything/miniconda3/envs/jy-align:/home/align-anything/miniconda3/envs/jy-align/x86_64-conda-linux-gnu/sysroot/usr
11
+ COLORTERM=truecolor
12
+ CONDA_BACKUP_ADDR2LINE=/data/align-anything/miniconda3/envs/jy-a/bin/x86_64-conda-linux-gnu-addr2line
13
+ CONDA_BACKUP_AR=/data/align-anything/miniconda3/envs/jy-a/bin/x86_64-conda-linux-gnu-ar
14
+ CONDA_BACKUP_AS=/data/align-anything/miniconda3/envs/jy-a/bin/x86_64-conda-linux-gnu-as
15
+ CONDA_BACKUP_BUILD=x86_64-conda-linux-gnu
16
+ CONDA_BACKUP_CC=/data/align-anything/miniconda3/envs/jy-a/bin/x86_64-conda-linux-gnu-cc
17
+ CONDA_BACKUP_CC_FOR_BUILD=/data/align-anything/miniconda3/envs/jy-a/bin/x86_64-conda-linux-gnu-cc
18
+ CONDA_BACKUP_CFLAGS=-march=nocona -mtune=haswell -ftree-vectorize -fPIC -fstack-protector-strong -fno-plt -O2 -ffunction-sections -pipe -isystem /data/align-anything/miniconda3/envs/jy-a/include -march=nocona -mtune=haswell -ftree-vectorize -fPIC -fstack-protector-strong -fno-plt -O2 -ffunction-sections -pipe -isystem /data/align-anything/miniconda3/envs/jy-a/include -I/data/align-anything/miniconda3/envs/jy-a/targets/x86_64-linux/include -L/data/align-anything/miniconda3/envs/jy-a/targets/x86_64-linux/lib -L/data/align-anything/miniconda3/envs/jy-a/targets/x86_64-linux/lib/stubs
19
+ CONDA_BACKUP_CMAKE_PREFIX_PATH=/data/align-anything/miniconda3/envs/jy-a:/data/align-anything/miniconda3/envs/jy-a/x86_64-conda-linux-gnu/sysroot/usr
20
+ CONDA_BACKUP_CONDA_BUILD_SYSROOT=/data/align-anything/miniconda3/envs/jy-a/x86_64-conda-linux-gnu/sysroot
21
+ CONDA_BACKUP_CONDA_TOOLCHAIN_BUILD=x86_64-conda-linux-gnu
22
+ CONDA_BACKUP_CONDA_TOOLCHAIN_HOST=x86_64-conda-linux-gnu
23
+ CONDA_BACKUP_CPP=/data/align-anything/miniconda3/envs/jy-a/bin/x86_64-conda-linux-gnu-cpp
24
+ CONDA_BACKUP_CPPFLAGS=-DNDEBUG -D_FORTIFY_SOURCE=2 -O2 -isystem /data/align-anything/miniconda3/envs/jy-a/include -DNDEBUG -D_FORTIFY_SOURCE=2 -O2 -isystem /data/align-anything/miniconda3/envs/jy-a/include -I/data/align-anything/miniconda3/envs/jy-a/targets/x86_64-linux/include -L/data/align-anything/miniconda3/envs/jy-a/targets/x86_64-linux/lib -L/data/align-anything/miniconda3/envs/jy-a/targets/x86_64-linux/lib/stubs
25
+ CONDA_BACKUP_CXX=/data/align-anything/miniconda3/envs/jy-a/bin/x86_64-conda-linux-gnu-c++
26
+ CONDA_BACKUP_CXXFILT=/data/align-anything/miniconda3/envs/jy-a/bin/x86_64-conda-linux-gnu-c++filt
27
+ CONDA_BACKUP_CXXFLAGS=-fvisibility-inlines-hidden -fmessage-length=0 -march=nocona -mtune=haswell -ftree-vectorize -fPIC -fstack-protector-strong -fno-plt -O2 -ffunction-sections -pipe -isystem /data/align-anything/miniconda3/envs/jy-a/include -fvisibility-inlines-hidden -fmessage-length=0 -march=nocona -mtune=haswell -ftree-vectorize -fPIC -fstack-protector-strong -fno-plt -O2 -ffunction-sections -pipe -isystem /data/align-anything/miniconda3/envs/jy-a/include -I/data/align-anything/miniconda3/envs/jy-a/targets/x86_64-linux/include -L/data/align-anything/miniconda3/envs/jy-a/targets/x86_64-linux/lib -L/data/align-anything/miniconda3/envs/jy-a/targets/x86_64-linux/lib/stubs
28
+ CONDA_BACKUP_CXX_FOR_BUILD=/data/align-anything/miniconda3/envs/jy-a/bin/x86_64-conda-linux-gnu-c++
29
+ CONDA_BACKUP_DEBUG_CFLAGS=-march=nocona -mtune=haswell -ftree-vectorize -fPIC -fstack-protector-all -fno-plt -Og -g -Wall -Wextra -fvar-tracking-assignments -ffunction-sections -pipe -isystem /data/align-anything/miniconda3/envs/jy-a/include -march=nocona -mtune=haswell -ftree-vectorize -fPIC -fstack-protector-all -fno-plt -Og -g -Wall -Wextra -fvar-tracking-assignments -ffunction-sections -pipe -isystem /data/align-anything/miniconda3/envs/jy-a/include
30
+ CONDA_BACKUP_DEBUG_CPPFLAGS=-D_DEBUG -D_FORTIFY_SOURCE=2 -Og -isystem /data/align-anything/miniconda3/envs/jy-a/include -D_DEBUG -D_FORTIFY_SOURCE=2 -Og -isystem /data/align-anything/miniconda3/envs/jy-a/include
31
+ CONDA_BACKUP_DEBUG_CXXFLAGS=-fvisibility-inlines-hidden -fmessage-length=0 -march=nocona -mtune=haswell -ftree-vectorize -fPIC -fstack-protector-all -fno-plt -Og -g -Wall -Wextra -fvar-tracking-assignments -ffunction-sections -pipe -isystem /data/align-anything/miniconda3/envs/jy-a/include -fvisibility-inlines-hidden -fmessage-length=0 -march=nocona -mtune=haswell -ftree-vectorize -fPIC -fstack-protector-all -fno-plt -Og -g -Wall -Wextra -fvar-tracking-assignments -ffunction-sections -pipe -isystem /data/align-anything/miniconda3/envs/jy-a/include
32
+ CONDA_BACKUP_DWP=/data/align-anything/miniconda3/envs/jy-a/bin/x86_64-conda-linux-gnu-dwp
33
+ CONDA_BACKUP_ELFEDIT=/data/align-anything/miniconda3/envs/jy-a/bin/x86_64-conda-linux-gnu-elfedit
34
+ CONDA_BACKUP_GCC=/data/align-anything/miniconda3/envs/jy-a/bin/x86_64-conda-linux-gnu-gcc
35
+ CONDA_BACKUP_GCC_AR=/data/align-anything/miniconda3/envs/jy-a/bin/x86_64-conda-linux-gnu-gcc-ar
36
+ CONDA_BACKUP_GCC_NM=/data/align-anything/miniconda3/envs/jy-a/bin/x86_64-conda-linux-gnu-gcc-nm
37
+ CONDA_BACKUP_GCC_RANLIB=/data/align-anything/miniconda3/envs/jy-a/bin/x86_64-conda-linux-gnu-gcc-ranlib
38
+ CONDA_BACKUP_GPROF=/data/align-anything/miniconda3/envs/jy-a/bin/x86_64-conda-linux-gnu-gprof
39
+ CONDA_BACKUP_GXX=/data/align-anything/miniconda3/envs/jy-a/bin/x86_64-conda-linux-gnu-g++
40
+ CONDA_BACKUP_HOST=x86_64-conda-linux-gnu
41
+ CONDA_BACKUP_LD=/data/align-anything/miniconda3/envs/jy-a/bin/x86_64-conda-linux-gnu-ld
42
+ CONDA_BACKUP_LDFLAGS=-Wl,-O2 -Wl,--sort-common -Wl,--as-needed -Wl,-z,relro -Wl,-z,now -Wl,--disable-new-dtags -Wl,--gc-sections -Wl,--allow-shlib-undefined -Wl,-rpath,/data/align-anything/miniconda3/envs/jy-a/lib -Wl,-rpath-link,/data/align-anything/miniconda3/envs/jy-a/lib -L/data/align-anything/miniconda3/envs/jy-a/lib -Wl,-O2 -Wl,--sort-common -Wl,--as-needed -Wl,-z,relro -Wl,-z,now -Wl,--disable-new-dtags -Wl,--gc-sections -Wl,--allow-shlib-undefined -Wl,-rpath,/data/align-anything/miniconda3/envs/jy-a/lib -Wl,-rpath-link,/data/align-anything/miniconda3/envs/jy-a/lib -L/data/align-anything/miniconda3/envs/jy-a/lib -L/data/align-anything/miniconda3/envs/jy-a/targets/x86_64-linux/lib -L/data/align-anything/miniconda3/envs/jy-a/targets/x86_64-linux/lib/stubs
43
+ CONDA_BACKUP_LD_GOLD=/data/align-anything/miniconda3/envs/jy-a/bin/x86_64-conda-linux-gnu-ld.gold
44
+ CONDA_BACKUP_NM=/data/align-anything/miniconda3/envs/jy-a/bin/x86_64-conda-linux-gnu-nm
45
+ CONDA_BACKUP_OBJCOPY=/data/align-anything/miniconda3/envs/jy-a/bin/x86_64-conda-linux-gnu-objcopy
46
+ CONDA_BACKUP_OBJDUMP=/data/align-anything/miniconda3/envs/jy-a/bin/x86_64-conda-linux-gnu-objdump
47
+ CONDA_BACKUP_RANLIB=/data/align-anything/miniconda3/envs/jy-a/bin/x86_64-conda-linux-gnu-ranlib
48
+ CONDA_BACKUP_READELF=/data/align-anything/miniconda3/envs/jy-a/bin/x86_64-conda-linux-gnu-readelf
49
+ CONDA_BACKUP_SIZE=/data/align-anything/miniconda3/envs/jy-a/bin/x86_64-conda-linux-gnu-size
50
+ CONDA_BACKUP_STRINGS=/data/align-anything/miniconda3/envs/jy-a/bin/x86_64-conda-linux-gnu-strings
51
+ CONDA_BACKUP_STRIP=/data/align-anything/miniconda3/envs/jy-a/bin/x86_64-conda-linux-gnu-strip
52
+ CONDA_BACKUP_build_alias=x86_64-conda-linux-gnu
53
+ CONDA_BACKUP_host_alias=x86_64-conda-linux-gnu
54
+ CONDA_BUILD_SYSROOT=/home/align-anything/miniconda3/envs/jy-align/x86_64-conda-linux-gnu/sysroot
55
+ CONDA_DEFAULT_ENV=jy-align
56
+ CONDA_EXE=/home/align-anything/miniconda3/bin/conda
57
+ CONDA_PREFIX=/home/align-anything/miniconda3/envs/jy-align
58
+ CONDA_PREFIX_1=/home/align-anything/miniconda3
59
+ CONDA_PREFIX_2=/data/align-anything/miniconda3/envs/jy-a
60
+ CONDA_PREFIX_3=/home/align-anything/miniconda3
61
+ CONDA_PROMPT_MODIFIER=(jy-align)
62
+ CONDA_PYTHON_EXE=/home/align-anything/miniconda3/bin/python
63
+ CONDA_ROOT=/home/align-anything/miniconda3
64
+ CONDA_SHLVL=4
65
+ CONDA_TOOLCHAIN_BUILD=x86_64-conda-linux-gnu
66
+ CONDA_TOOLCHAIN_HOST=x86_64-conda-linux-gnu
67
+ CPP=/home/align-anything/miniconda3/envs/jy-align/bin/x86_64-conda-linux-gnu-cpp
68
+ CPPFLAGS=-DNDEBUG -D_FORTIFY_SOURCE=2 -O2 -isystem /home/align-anything/miniconda3/envs/jy-align/include -DNDEBUG -D_FORTIFY_SOURCE=2 -O2 -isystem /data/align-anything/miniconda3/envs/jy-a/include -DNDEBUG -D_FORTIFY_SOURCE=2 -O2 -isystem /data/align-anything/miniconda3/envs/jy-a/include -I/data/align-anything/miniconda3/envs/jy-a/targets/x86_64-linux/include -L/data/align-anything/miniconda3/envs/jy-a/targets/x86_64-linux/lib -L/data/align-anything/miniconda3/envs/jy-a/targets/x86_64-linux/lib/stubs -I/home/align-anything/miniconda3/envs/jy-align/targets/x86_64-linux/include -L/home/align-anything/miniconda3/envs/jy-align/targets/x86_64-linux/lib -L/home/align-anything/miniconda3/envs/jy-align/targets/x86_64-linux/lib/stubs
69
+ CROSS_RANK=0
70
+ CROSS_SIZE=1
71
+ CUDA_MODULE_LOADING=LAZY
72
+ CUDA_VISIBLE_DEVICES=0,1,2,3,4,5,6,7
73
+ CXX=/home/align-anything/miniconda3/envs/jy-align/bin/x86_64-conda-linux-gnu-c++
74
+ CXXFILT=/home/align-anything/miniconda3/envs/jy-align/bin/x86_64-conda-linux-gnu-c++filt
75
+ CXXFLAGS=-fvisibility-inlines-hidden -fmessage-length=0 -march=nocona -mtune=haswell -ftree-vectorize -fPIC -fstack-protector-strong -fno-plt -O2 -ffunction-sections -pipe -isystem /home/align-anything/miniconda3/envs/jy-align/include -fvisibility-inlines-hidden -fmessage-length=0 -march=nocona -mtune=haswell -ftree-vectorize -fPIC -fstack-protector-strong -fno-plt -O2 -ffunction-sections -pipe -isystem /data/align-anything/miniconda3/envs/jy-a/include -fvisibility-inlines-hidden -fmessage-length=0 -march=nocona -mtune=haswell -ftree-vectorize -fPIC -fstack-protector-strong -fno-plt -O2 -ffunction-sections -pipe -isystem /data/align-anything/miniconda3/envs/jy-a/include -I/data/align-anything/miniconda3/envs/jy-a/targets/x86_64-linux/include -L/data/align-anything/miniconda3/envs/jy-a/targets/x86_64-linux/lib -L/data/align-anything/miniconda3/envs/jy-a/targets/x86_64-linux/lib/stubs -I/home/align-anything/miniconda3/envs/jy-align/targets/x86_64-linux/include -L/home/align-anything/miniconda3/envs/jy-align/targets/x86_64-linux/lib -L/home/align-anything/miniconda3/envs/jy-align/targets/x86_64-linux/lib/stubs
76
+ CXX_FOR_BUILD=/home/align-anything/miniconda3/envs/jy-align/bin/x86_64-conda-linux-gnu-c++
77
+ DBUS_SESSION_BUS_ADDRESS=unix:path=/run/user/2000/bus
78
+ DEBUG_CFLAGS=-march=nocona -mtune=haswell -ftree-vectorize -fPIC -fstack-protector-all -fno-plt -Og -g -Wall -Wextra -fvar-tracking-assignments -ffunction-sections -pipe -isystem /home/align-anything/miniconda3/envs/jy-align/include -march=nocona -mtune=haswell -ftree-vectorize -fPIC -fstack-protector-all -fno-plt -Og -g -Wall -Wextra -fvar-tracking-assignments -ffunction-sections -pipe -isystem /data/align-anything/miniconda3/envs/jy-a/include -march=nocona -mtune=haswell -ftree-vectorize -fPIC -fstack-protector-all -fno-plt -Og -g -Wall -Wextra -fvar-tracking-assignments -ffunction-sections -pipe -isystem /data/align-anything/miniconda3/envs/jy-a/include
79
+ DEBUG_CPPFLAGS=-D_DEBUG -D_FORTIFY_SOURCE=2 -Og -isystem /home/align-anything/miniconda3/envs/jy-align/include -D_DEBUG -D_FORTIFY_SOURCE=2 -Og -isystem /data/align-anything/miniconda3/envs/jy-a/include -D_DEBUG -D_FORTIFY_SOURCE=2 -Og -isystem /data/align-anything/miniconda3/envs/jy-a/include
80
+ DEBUG_CXXFLAGS=-fvisibility-inlines-hidden -fmessage-length=0 -march=nocona -mtune=haswell -ftree-vectorize -fPIC -fstack-protector-all -fno-plt -Og -g -Wall -Wextra -fvar-tracking-assignments -ffunction-sections -pipe -isystem /home/align-anything/miniconda3/envs/jy-align/include -fvisibility-inlines-hidden -fmessage-length=0 -march=nocona -mtune=haswell -ftree-vectorize -fPIC -fstack-protector-all -fno-plt -Og -g -Wall -Wextra -fvar-tracking-assignments -ffunction-sections -pipe -isystem /data/align-anything/miniconda3/envs/jy-a/include -fvisibility-inlines-hidden -fmessage-length=0 -march=nocona -mtune=haswell -ftree-vectorize -fPIC -fstack-protector-all -fno-plt -Og -g -Wall -Wextra -fvar-tracking-assignments -ffunction-sections -pipe -isystem /data/align-anything/miniconda3/envs/jy-a/include
81
+ DWP=/home/align-anything/miniconda3/envs/jy-align/bin/x86_64-conda-linux-gnu-dwp
82
+ ELFEDIT=/home/align-anything/miniconda3/envs/jy-align/bin/x86_64-conda-linux-gnu-elfedit
83
+ GCC=/home/align-anything/miniconda3/envs/jy-align/bin/x86_64-conda-linux-gnu-gcc
84
+ GCC_AR=/home/align-anything/miniconda3/envs/jy-align/bin/x86_64-conda-linux-gnu-gcc-ar
85
+ GCC_NM=/home/align-anything/miniconda3/envs/jy-align/bin/x86_64-conda-linux-gnu-gcc-nm
86
+ GCC_RANLIB=/home/align-anything/miniconda3/envs/jy-align/bin/x86_64-conda-linux-gnu-gcc-ranlib
87
+ GIT_ASKPASS=/home/align-anything/.cursor-server/cli/servers/Stable-51c8aff7cb5a89f4a0e462fbacab938bdbfaf140/server/extensions/git/dist/askpass.sh
88
+ GPROF=/home/align-anything/miniconda3/envs/jy-align/bin/x86_64-conda-linux-gnu-gprof
89
+ GXX=/home/align-anything/miniconda3/envs/jy-align/bin/x86_64-conda-linux-gnu-g++
90
+ HOME=/home/align-anything
91
+ HOST=x86_64-conda-linux-gnu
92
+ KMP_DUPLICATE_LIB_OK=True
93
+ LANG=en_US.UTF-8
94
+ LD=/home/align-anything/miniconda3/envs/jy-align/bin/x86_64-conda-linux-gnu-ld
95
+ LDFLAGS=-Wl,-O2 -Wl,--sort-common -Wl,--as-needed -Wl,-z,relro -Wl,-z,now -Wl,--disable-new-dtags -Wl,--gc-sections -Wl,--allow-shlib-undefined -Wl,-rpath,/home/align-anything/miniconda3/envs/jy-align/lib -Wl,-rpath-link,/home/align-anything/miniconda3/envs/jy-align/lib -L/home/align-anything/miniconda3/envs/jy-align/lib -Wl,-O2 -Wl,--sort-common -Wl,--as-needed -Wl,-z,relro -Wl,-z,now -Wl,--disable-new-dtags -Wl,--gc-sections -Wl,--allow-shlib-undefined -Wl,-rpath,/data/align-anything/miniconda3/envs/jy-a/lib -Wl,-rpath-link,/data/align-anything/miniconda3/envs/jy-a/lib -L/data/align-anything/miniconda3/envs/jy-a/lib -Wl,-O2 -Wl,--sort-common -Wl,--as-needed -Wl,-z,relro -Wl,-z,now -Wl,--disable-new-dtags -Wl,--gc-sections -Wl,--allow-shlib-undefined -Wl,-rpath,/data/align-anything/miniconda3/envs/jy-a/lib -Wl,-rpath-link,/data/align-anything/miniconda3/envs/jy-a/lib -L/data/align-anything/miniconda3/envs/jy-a/lib -L/data/align-anything/miniconda3/envs/jy-a/targets/x86_64-linux/lib -L/data/align-anything/miniconda3/envs/jy-a/targets/x86_64-linux/lib/stubs -L/home/align-anything/miniconda3/envs/jy-align/targets/x86_64-linux/lib -L/home/align-anything/miniconda3/envs/jy-align/targets/x86_64-linux/lib/stubs
96
+ LD_GOLD=/home/align-anything/miniconda3/envs/jy-align/bin/x86_64-conda-linux-gnu-ld.gold
97
+ LD_LIBRARY_PATH=/home/align-anything/miniconda3/envs/jy-align/lib/python3.11/site-packages/cv2/../../lib64:
98
+ LESSCLOSE=/usr/bin/lesspipe %s %s
99
+ LESSOPEN=| /usr/bin/lesspipe %s
100
+ LOCAL_RANK=0
101
+ LOCAL_SIZE=8
102
+ LOGLEVEL=WARNING
103
+ LOGNAME=align-anything
104
+ LS_COLORS=rs=0:di=01;34:ln=01;36:mh=00:pi=40;33:so=01;35:do=01;35:bd=40;33;01:cd=40;33;01:or=40;31;01:mi=00:su=37;41:sg=30;43:ca=30;41:tw=30;42:ow=34;42:st=37;44:ex=01;32:*.tar=01;31:*.tgz=01;31:*.arc=01;31:*.arj=01;31:*.taz=01;31:*.lha=01;31:*.lz4=01;31:*.lzh=01;31:*.lzma=01;31:*.tlz=01;31:*.txz=01;31:*.tzo=01;31:*.t7z=01;31:*.zip=01;31:*.z=01;31:*.dz=01;31:*.gz=01;31:*.lrz=01;31:*.lz=01;31:*.lzo=01;31:*.xz=01;31:*.zst=01;31:*.tzst=01;31:*.bz2=01;31:*.bz=01;31:*.tbz=01;31:*.tbz2=01;31:*.tz=01;31:*.deb=01;31:*.rpm=01;31:*.jar=01;31:*.war=01;31:*.ear=01;31:*.sar=01;31:*.rar=01;31:*.alz=01;31:*.ace=01;31:*.zoo=01;31:*.cpio=01;31:*.7z=01;31:*.rz=01;31:*.cab=01;31:*.wim=01;31:*.swm=01;31:*.dwm=01;31:*.esd=01;31:*.jpg=01;35:*.jpeg=01;35:*.mjpg=01;35:*.mjpeg=01;35:*.gif=01;35:*.bmp=01;35:*.pbm=01;35:*.pgm=01;35:*.ppm=01;35:*.tga=01;35:*.xbm=01;35:*.xpm=01;35:*.tif=01;35:*.tiff=01;35:*.png=01;35:*.svg=01;35:*.svgz=01;35:*.mng=01;35:*.pcx=01;35:*.mov=01;35:*.mpg=01;35:*.mpeg=01;35:*.m2v=01;35:*.mkv=01;35:*.webm=01;35:*.ogm=01;35:*.mp4=01;35:*.m4v=01;35:*.mp4v=01;35:*.vob=01;35:*.qt=01;35:*.nuv=01;35:*.wmv=01;35:*.asf=01;35:*.rm=01;35:*.rmvb=01;35:*.flc=01;35:*.avi=01;35:*.fli=01;35:*.flv=01;35:*.gl=01;35:*.dl=01;35:*.xcf=01;35:*.xwd=01;35:*.yuv=01;35:*.cgm=01;35:*.emf=01;35:*.ogv=01;35:*.ogx=01;35:*.aac=00;36:*.au=00;36:*.flac=00;36:*.m4a=00;36:*.mid=00;36:*.midi=00;36:*.mka=00;36:*.mp3=00;36:*.mpc=00;36:*.ogg=00;36:*.ra=00;36:*.wav=00;36:*.oga=00;36:*.opus=00;36:*.spx=00;36:*.xspf=00;36:
105
+ MASTER_ADDR=127.0.0.1
106
+ MASTER_PORT=19716
107
+ MESON_ARGS=-Dbuildtype=release
108
+ MOTD_SHOWN=pam
109
+ NM=/home/align-anything/miniconda3/envs/jy-align/bin/x86_64-conda-linux-gnu-nm
110
+ NVCC_PREPEND_FLAGS= -ccbin=/data/align-anything/miniconda3/envs/jy-a/bin/x86_64-conda-linux-gnu-c++ -ccbin=/home/align-anything/miniconda3/envs/jy-align/bin/x86_64-conda-linux-gnu-c++
111
+ NVCC_PREPEND_FLAGS_BACKUP= -ccbin=/data/align-anything/miniconda3/envs/jy-a/bin/x86_64-conda-linux-gnu-c++
112
+ OBJCOPY=/home/align-anything/miniconda3/envs/jy-align/bin/x86_64-conda-linux-gnu-objcopy
113
+ OBJDUMP=/home/align-anything/miniconda3/envs/jy-align/bin/x86_64-conda-linux-gnu-objdump
114
+ OLDPWD=/data/align-anything/jiayi/ti2t/ml-mia-bench
115
+ PATH=/home/align-anything/miniconda3/envs/jy-align/bin:/home/align-anything/.cursor-server/cli/servers/Stable-949de58bd3d85d530972cac2dffc4feb9eee1e40/server/bin/remote-cli:/home/align-anything/miniconda3/envs/jy-align/bin:/home/align-anything/miniconda3/condabin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/usr/local/games:/snap/bin:/home/align-anything/.cursor-server/cli/servers/Stable-949de58bd3d85d530972cac2dffc4feb9eee1e40/server/bin/remote-cli:/home/align-anything/miniconda3/bin:/home/align-anything/miniconda3/condabin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/usr/local/games:/snap/bin:/home/align-anything/.cursor-server/cli/servers/Stable-949de58bd3d85d530972cac2dffc4feb9eee1e40/server/bin/remote-cli:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/usr/local/games:/snap/bin
116
+ PWD=/home/align-anything/align-anything/local_scripts
117
+ PYGAME_HIDE_SUPPORT_PROMPT=1
118
+ PYTHONHASHSEED=42
119
+ PYTHONPATH=/home/align-anything/align-anything
120
+ RANK=0
121
+ RANLIB=/home/align-anything/miniconda3/envs/jy-align/bin/x86_64-conda-linux-gnu-ranlib
122
+ READELF=/home/align-anything/miniconda3/envs/jy-align/bin/x86_64-conda-linux-gnu-readelf
123
+ SHELL=/bin/bash
124
+ SHLVL=3
125
+ SIZE=/home/align-anything/miniconda3/envs/jy-align/bin/x86_64-conda-linux-gnu-size
126
+ SSH_CLIENT=117.136.0.149 36325 30400
127
+ SSH_CONNECTION=222.129.2.20 6039 10.10.212.194 30400
128
+ SSL_CERT_DIR=/usr/lib/ssl/certs
129
+ SSL_CERT_FILE=/usr/lib/ssl/certs/ca-certificates.crt
130
+ STRINGS=/home/align-anything/miniconda3/envs/jy-align/bin/x86_64-conda-linux-gnu-strings
131
+ STRIP=/home/align-anything/miniconda3/envs/jy-align/bin/x86_64-conda-linux-gnu-strip
132
+ TERM=screen
133
+ TERM_PROGRAM=vscode
134
+ TERM_PROGRAM_VERSION=0.41.3
135
+ TMUX=/tmp/tmux-2000/default,34082,15
136
+ TMUX_PANE=%15
137
+ USER=align-anything
138
+ VSCODE_GIT_ASKPASS_EXTRA_ARGS=
139
+ VSCODE_GIT_ASKPASS_MAIN=/home/align-anything/.cursor-server/cli/servers/Stable-51c8aff7cb5a89f4a0e462fbacab938bdbfaf140/server/extensions/git/dist/askpass-main.js
140
+ VSCODE_GIT_ASKPASS_NODE=/home/align-anything/.cursor-server/cli/servers/Stable-51c8aff7cb5a89f4a0e462fbacab938bdbfaf140/server/node
141
+ VSCODE_GIT_IPC_HANDLE=/run/user/2000/vscode-git-ef8058c264.sock
142
+ VSCODE_IPC_HOOK_CLI=/run/user/2000/vscode-ipc-db013265-9a8a-4fb7-ba94-00b66d808feb.sock
143
+ WANDB_API_KEY=<REDACTED>
144
+ WANDB_SERVICE=2-3156467-tcp-localhost-37181
145
+ WORLD_SIZE=8
146
+ XDG_DATA_DIRS=/usr/local/share:/usr/share:/var/lib/snapd/desktop
147
+ XDG_RUNTIME_DIR=/run/user/2000
148
+ XDG_SESSION_CLASS=user
149
+ XDG_SESSION_ID=11
150
+ XDG_SESSION_TYPE=tty
151
+ _=/home/align-anything/miniconda3/envs/jy-align/bin/deepspeed
152
+ _CE_CONDA=
153
+ _CE_M=
154
+ _CONDA_PYTHON_SYSCONFIGDATA_NAME=_sysconfigdata_x86_64_conda_cos6_linux_gnu
155
+ build_alias=x86_64-conda-linux-gnu
156
+ host_alias=x86_64-conda-linux-gnu
preprocessor_config.json ADDED
@@ -0,0 +1,28 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "crop_size": {
3
+ "height": 336,
4
+ "width": 336
5
+ },
6
+ "do_center_crop": true,
7
+ "do_convert_rgb": true,
8
+ "do_normalize": true,
9
+ "do_rescale": true,
10
+ "do_resize": true,
11
+ "image_mean": [
12
+ 0.48145466,
13
+ 0.4578275,
14
+ 0.40821073
15
+ ],
16
+ "image_processor_type": "CLIPImageProcessor",
17
+ "image_std": [
18
+ 0.26862954,
19
+ 0.26130258,
20
+ 0.27577711
21
+ ],
22
+ "processor_class": "LlavaProcessor",
23
+ "resample": 3,
24
+ "rescale_factor": 0.00392156862745098,
25
+ "size": {
26
+ "shortest_edge": 336
27
+ }
28
+ }
processor_config.json ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {
2
+ "image_token": "<image>",
3
+ "patch_size": null,
4
+ "processor_class": "LlavaProcessor",
5
+ "vision_feature_select_strategy": null
6
+ }
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d1bb8dc467d996f37ec04ef316c32fd51f8fe8b0a369e1be087fade93ee1a21
3
+ size 26703272169
script.sh ADDED
@@ -0,0 +1,34 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ MODEL_NAME_OR_PATH="/data/models/llava/llava-1.5-13b-hf" # model path
2
+
3
+ TRAIN_DATASETS="/data/align-anything/jiayi/ti2t/refine_gen_wo_res/1021_13b_2000" # dataset path
4
+ TRAIN_TEMPLATE="AA_TI2T_Critique" # dataset template
5
+ TRAIN_SPLIT="train" # split the dataset
6
+
7
+ PTX_DATASETS="/data/align-anything/jiayi/ti2t/ti-to-t-instruction-following"
8
+ PTX_TEMPLATE="AA_TI2T"
9
+ PTX_SPLIT="train"
10
+
11
+ OUTPUT_DIR="/data/align-anything/jiayi/ti2t/rm_10_22_ours_13b_2000/slice_2392" # output dir
12
+ export CUDA_HOME='/data/align-anything/miniconda3/envs/jy-s'
13
+ # For wandb online logging
14
+ export WANDB_API_KEY="***REDACTED***"
15
+ export NCCL_SOCKET_IFNAME="bond0.212"
16
+
17
+ # Source the setup script
18
+ source ./setup.sh
19
+
20
+ # Execute deepspeed command
21
+ deepspeed \
22
+ --hostfile ./hostfile \
23
+ --master_port ${MASTER_PORT} \
24
+ --module align_anything.trainers.text_image_to_text.dpo \
25
+ --model_name_or_path ${MODEL_NAME_OR_PATH} \
26
+ --train_datasets ${TRAIN_DATASETS} \
27
+ --train_template ${TRAIN_TEMPLATE} \
28
+ --train_split ${TRAIN_SPLIT} \
29
+ --ptx_datasets ${PTX_DATASETS} \
30
+ --ptx_template ${PTX_TEMPLATE} \
31
+ --ptx_split ${PTX_SPLIT} \
32
+ --output_dir ${OUTPUT_DIR} \
33
+ --save_interval 1200 \
34
+ --epochs 5
special_tokens_map.json ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "content": "<s>",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "eos_token": {
10
+ "content": "</s>",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "pad_token": {
17
+ "content": "<pad>",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ },
23
+ "unk_token": {
24
+ "content": "<unk>",
25
+ "lstrip": false,
26
+ "normalized": false,
27
+ "rstrip": false,
28
+ "single_word": false
29
+ }
30
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e556afd44213b6bd1be2b850ebbbd98f5481437a8021afaf58ee7fb1818d347
3
+ size 499723
tokenizer_config.json ADDED
@@ -0,0 +1,60 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_bos_token": true,
3
+ "add_eos_token": false,
4
+ "add_prefix_space": null,
5
+ "added_tokens_decoder": {
6
+ "0": {
7
+ "content": "<unk>",
8
+ "lstrip": false,
9
+ "normalized": false,
10
+ "rstrip": false,
11
+ "single_word": false,
12
+ "special": true
13
+ },
14
+ "1": {
15
+ "content": "<s>",
16
+ "lstrip": false,
17
+ "normalized": false,
18
+ "rstrip": false,
19
+ "single_word": false,
20
+ "special": true
21
+ },
22
+ "2": {
23
+ "content": "</s>",
24
+ "lstrip": false,
25
+ "normalized": false,
26
+ "rstrip": false,
27
+ "single_word": false,
28
+ "special": true
29
+ },
30
+ "32000": {
31
+ "content": "<image>",
32
+ "lstrip": false,
33
+ "normalized": false,
34
+ "rstrip": false,
35
+ "single_word": false,
36
+ "special": true
37
+ },
38
+ "32001": {
39
+ "content": "<pad>",
40
+ "lstrip": false,
41
+ "normalized": false,
42
+ "rstrip": false,
43
+ "single_word": false,
44
+ "special": true
45
+ }
46
+ },
47
+ "bos_token": "<s>",
48
+ "clean_up_tokenization_spaces": false,
49
+ "eos_token": "</s>",
50
+ "legacy": false,
51
+ "model_max_length": 2048,
52
+ "pad_token": "<pad>",
53
+ "padding_side": "right",
54
+ "processor_class": "LlavaProcessor",
55
+ "sp_model_kwargs": {},
56
+ "tokenizer_class": "LlamaTokenizer",
57
+ "trust_remote_code": false,
58
+ "unk_token": "<unk>",
59
+ "use_default_system_prompt": false
60
+ }
wandb/debug-internal.log ADDED
@@ -0,0 +1,25 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"time":"2024-10-23T19:53:32.034282892Z","level":"INFO","msg":"using version","core version":"0.18.5"}
2
+ {"time":"2024-10-23T19:53:32.034313596Z","level":"INFO","msg":"created symlink","path":"/data/align-anything/jiayi/ti2t/rm_10_22_ours_13b_2000/wandb/run-20241023_195332-5p9x2ymn/logs/debug-core.log"}
3
+ {"time":"2024-10-23T19:53:32.257077888Z","level":"INFO","msg":"created new stream","id":"5p9x2ymn"}
4
+ {"time":"2024-10-23T19:53:32.25716001Z","level":"INFO","msg":"stream: started","id":"5p9x2ymn"}
5
+ {"time":"2024-10-23T19:53:32.257194334Z","level":"INFO","msg":"sender: started","stream_id":"5p9x2ymn"}
6
+ {"time":"2024-10-23T19:53:32.257175304Z","level":"INFO","msg":"handler: started","stream_id":{"value":"5p9x2ymn"}}
7
+ {"time":"2024-10-23T19:53:32.257226079Z","level":"INFO","msg":"writer: Do: started","stream_id":{"value":"5p9x2ymn"}}
8
+ {"time":"2024-10-23T19:53:33.030824275Z","level":"INFO","msg":"Starting system monitor"}
9
+ {"time":"2024-10-23T23:33:34.192965196Z","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/524339208/align-anything/5p9x2ymn/file_stream"}
10
+ {"time":"2024-10-24T00:17:33.02116761Z","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": context deadline exceeded"}
11
+ {"time":"2024-10-24T00:17:38.542096425Z","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/524339208/align-anything/5p9x2ymn/file_stream"}
12
+ {"time":"2024-10-24T00:33:58.505798828Z","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/524339208/align-anything/5p9x2ymn/file_stream"}
13
+ {"time":"2024-10-24T03:15:33.036197732Z","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/524339208/align-anything/5p9x2ymn/file_stream\": EOF"}
14
+ {"time":"2024-10-24T03:15:33.036293074Z","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": unexpected EOF"}
15
+ {"time":"2024-10-24T06:50:25.927379401Z","level":"INFO","msg":"Stopping system monitor"}
16
+ {"time":"2024-10-24T06:50:25.928726748Z","level":"INFO","msg":"Stopped system monitor"}
17
+ {"time":"2024-10-24T06:50:26.45386731Z","level":"WARN","msg":"No program path found, not creating job artifact. See https://docs.wandb.ai/guides/launch/create-job"}
18
+ {"time":"2024-10-24T06:50:26.453900793Z","level":"INFO","msg":"sender: sendDefer: no job artifact to save"}
19
+ {"time":"2024-10-24T06:50:26.928252456Z","level":"INFO","msg":"handler: operation stats","stats":{"operations":[{"desc":"uploading wandb-summary.json","runtime_seconds":0.450821229,"progress":"331B/331B"},{"desc":"uploading config.yaml","runtime_seconds":0.185946124,"progress":"2.5KB/2.5KB"},{"desc":"uploading output.log","runtime_seconds":0.185925636,"progress":"64.0KB/291.8KB"}],"total_operations":3}}
20
+ {"time":"2024-10-24T06:50:27.530089799Z","level":"INFO","msg":"fileTransfer: Close: file transfer manager closed"}
21
+ {"time":"2024-10-24T06:50:29.024633815Z","level":"INFO","msg":"stream: closing","id":"5p9x2ymn"}
22
+ {"time":"2024-10-24T06:50:29.024666435Z","level":"INFO","msg":"handler: closed","stream_id":{"value":"5p9x2ymn"}}
23
+ {"time":"2024-10-24T06:50:29.024712782Z","level":"INFO","msg":"sender: closed","stream_id":"5p9x2ymn"}
24
+ {"time":"2024-10-24T06:50:29.024699477Z","level":"INFO","msg":"writer: Close: closed","stream_id":{"value":"5p9x2ymn"}}
25
+ {"time":"2024-10-24T06:50:29.025524254Z","level":"INFO","msg":"stream: closed","id":"5p9x2ymn"}
wandb/debug.log ADDED
@@ -0,0 +1,33 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2024-10-23 19:53:32,022 INFO MainThread:3156467 [wandb_setup.py:_flush():79] Current SDK version is 0.18.5
2
+ 2024-10-23 19:53:32,022 INFO MainThread:3156467 [wandb_setup.py:_flush():79] Configure stats pid to 3156467
3
+ 2024-10-23 19:53:32,022 INFO MainThread:3156467 [wandb_setup.py:_flush():79] Loading settings from /home/align-anything/.config/wandb/settings
4
+ 2024-10-23 19:53:32,022 INFO MainThread:3156467 [wandb_setup.py:_flush():79] Loading settings from /home/align-anything/align-anything/local_scripts/wandb/settings
5
+ 2024-10-23 19:53:32,022 INFO MainThread:3156467 [wandb_setup.py:_flush():79] Loading settings from environment variables: {'api_key': '***REDACTED***'}
6
+ 2024-10-23 19:53:32,022 INFO MainThread:3156467 [wandb_setup.py:_flush():79] Applying setup settings: {'mode': None, '_disable_service': None}
7
+ 2024-10-23 19:53:32,022 WARNING MainThread:3156467 [wandb_setup.py:_flush():79] Could not find program at -m align_anything.trainers.text_image_to_text.rm
8
+ 2024-10-23 19:53:32,022 INFO MainThread:3156467 [wandb_setup.py:_flush():79] Inferring run settings from compute environment: {'program_relpath': None, 'program': '-m align_anything.trainers.text_image_to_text.rm'}
9
+ 2024-10-23 19:53:32,022 INFO MainThread:3156467 [wandb_setup.py:_flush():79] Applying login settings: {}
10
+ 2024-10-23 19:53:32,023 INFO MainThread:3156467 [wandb_init.py:_log_setup():534] Logging user logs to /data/align-anything/jiayi/ti2t/rm_10_22_ours_13b_2000/wandb/run-20241023_195332-5p9x2ymn/logs/debug.log
11
+ 2024-10-23 19:53:32,023 INFO MainThread:3156467 [wandb_init.py:_log_setup():535] Logging internal logs to /data/align-anything/jiayi/ti2t/rm_10_22_ours_13b_2000/wandb/run-20241023_195332-5p9x2ymn/logs/debug-internal.log
12
+ 2024-10-23 19:53:32,023 INFO MainThread:3156467 [wandb_init.py:init():621] calling init triggers
13
+ 2024-10-23 19:53:32,023 INFO MainThread:3156467 [wandb_init.py:init():628] wandb.init called with sweep_config: {}
14
+ config: {'train_cfgs': {'ds_cfgs': 'ds_z3_config.json', 'epochs': 5.0, 'seed': 42, 'per_device_train_batch_size': 4, 'per_device_eval_batch_size': 4, 'gradient_accumulation_steps': 1, 'gradient_checkpointing': True, 'learning_rate': 3e-05, 'lr_scheduler_type': 'constant_with_warmup', 'lr_warmup_ratio': 0.03, 'weight_decay': 0.0, 'adam_betas': [0.9, 0.95], 'bf16': True, 'fp16': False, 'eval_strategy': 'epoch', 'eval_interval': 10, 'regularization': 0.001, 'freeze_mm_proj': False, 'freeze_vision_tower': True, 'freeze_language_model': False}, 'data_cfgs': {'train_datasets': '/data/align-anything/jiayi/ti2t/refine_gen_wo_res/1021_13b_2000', 'train_template': 'AA_TI2T_Critique', 'train_name': None, 'train_size': None, 'train_split': 'train', 'train_subset': None, 'train_data_files': None, 'train_optional_args': [], 'eval_datasets': '/home/align-anything/datasets/40k_ti2t_filtered', 'eval_template': 'AA_TI2T', 'eval_name': None, 'eval_size': None, 'eval_split': 'train', 'eval_subset': None, 'eval_data_files': None, 'eval_optional_args': []}, 'logger_cfgs': {'log_type': 'wandb', 'log_project': 'align-anything', 'log_run_name': 'rm', 'output_dir': '/data/align-anything/jiayi/ti2t/rm_10_22_ours_13b_2000', 'cache_dir': None, 'save_interval': 598.0}, 'model_cfgs': {'model_name_or_path': '/data/models/llava/llava-1.5-13b-hf', 'trust_remote_code': True, 'model_max_length': 2048}, 'special_tokens': None}
15
+ 2024-10-23 19:53:32,023 INFO MainThread:3156467 [wandb_init.py:init():671] starting backend
16
+ 2024-10-23 19:53:32,023 INFO MainThread:3156467 [wandb_init.py:init():675] sending inform_init request
17
+ 2024-10-23 19:53:32,027 INFO MainThread:3156467 [backend.py:_multiprocessing_setup():104] multiprocessing start_methods=fork,spawn,forkserver, using: spawn
18
+ 2024-10-23 19:53:32,027 INFO MainThread:3156467 [wandb_init.py:init():688] backend started and connected
19
+ 2024-10-23 19:53:32,030 INFO MainThread:3156467 [wandb_init.py:init():783] updated telemetry
20
+ 2024-10-23 19:53:32,036 INFO MainThread:3156467 [wandb_init.py:init():816] communicating run to backend with 90.0 second timeout
21
+ 2024-10-23 19:53:33,024 INFO MainThread:3156467 [wandb_init.py:init():867] starting run threads in backend
22
+ 2024-10-23 19:53:33,160 INFO MainThread:3156467 [wandb_run.py:_console_start():2463] atexit reg
23
+ 2024-10-23 19:53:33,160 INFO MainThread:3156467 [wandb_run.py:_redirect():2311] redirect: wrap_raw
24
+ 2024-10-23 19:53:33,160 INFO MainThread:3156467 [wandb_run.py:_redirect():2376] Wrapping output streams.
25
+ 2024-10-23 19:53:33,160 INFO MainThread:3156467 [wandb_run.py:_redirect():2401] Redirects installed.
26
+ 2024-10-23 19:53:33,164 INFO MainThread:3156467 [wandb_init.py:init():911] run started, returning control to user process
27
+ 2024-10-24 06:50:25,922 INFO MainThread:3156467 [wandb_run.py:_finish():2158] finishing run 524339208/align-anything/5p9x2ymn
28
+ 2024-10-24 06:50:25,925 INFO MainThread:3156467 [wandb_run.py:_atexit_cleanup():2426] got exitcode: 0
29
+ 2024-10-24 06:50:25,926 INFO MainThread:3156467 [wandb_run.py:_restore():2408] restore
30
+ 2024-10-24 06:50:25,926 INFO MainThread:3156467 [wandb_run.py:_restore():2414] restore done
31
+ 2024-10-24 06:50:29,011 INFO MainThread:3156467 [wandb_run.py:_footer_history_summary_info():3975] rendering history
32
+ 2024-10-24 06:50:29,013 INFO MainThread:3156467 [wandb_run.py:_footer_history_summary_info():4007] rendering summary
33
+ 2024-10-24 06:50:29,023 INFO MainThread:3156467 [wandb_run.py:_footer_sync_info():3934] logging synced files
wandb/run-20241023_195332-5p9x2ymn/files/config.yaml ADDED
@@ -0,0 +1,99 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ _wandb:
2
+ value:
3
+ cli_version: 0.18.5
4
+ m: []
5
+ python_version: 3.11.10
6
+ t:
7
+ "1":
8
+ - 1
9
+ - 11
10
+ - 41
11
+ - 49
12
+ - 51
13
+ - 55
14
+ - 71
15
+ - 83
16
+ - 98
17
+ - 105
18
+ "2":
19
+ - 1
20
+ - 11
21
+ - 41
22
+ - 49
23
+ - 51
24
+ - 55
25
+ - 71
26
+ - 83
27
+ - 98
28
+ - 105
29
+ "3":
30
+ - 2
31
+ - 13
32
+ - 16
33
+ - 23
34
+ - 55
35
+ - 61
36
+ "4": 3.11.10
37
+ "5": 0.18.5
38
+ "6": 4.46.0.dev0
39
+ "8":
40
+ - 5
41
+ "12": 0.18.5
42
+ "13": linux-x86_64
43
+ data_cfgs:
44
+ value:
45
+ eval_data_files: null
46
+ eval_datasets: /home/align-anything/datasets/40k_ti2t_filtered
47
+ eval_name: null
48
+ eval_optional_args: []
49
+ eval_size: null
50
+ eval_split: train
51
+ eval_subset: null
52
+ eval_template: AA_TI2T
53
+ train_data_files: null
54
+ train_datasets: /data/align-anything/jiayi/ti2t/refine_gen_wo_res/1021_13b_2000
55
+ train_name: null
56
+ train_optional_args: []
57
+ train_size: null
58
+ train_split: train
59
+ train_subset: null
60
+ train_template: AA_TI2T_Critique
61
+ logger_cfgs:
62
+ value:
63
+ cache_dir: null
64
+ log_project: align-anything
65
+ log_run_name: rm
66
+ log_type: wandb
67
+ output_dir: /data/align-anything/jiayi/ti2t/rm_10_22_ours_13b_2000
68
+ save_interval: 598
69
+ model_cfgs:
70
+ value:
71
+ model_max_length: 2048
72
+ model_name_or_path: /data/models/llava/llava-1.5-13b-hf
73
+ trust_remote_code: true
74
+ special_tokens:
75
+ value: null
76
+ train_cfgs:
77
+ value:
78
+ adam_betas:
79
+ - 0.9
80
+ - 0.95
81
+ bf16: true
82
+ ds_cfgs: ds_z3_config.json
83
+ epochs: 5
84
+ eval_interval: 10
85
+ eval_strategy: epoch
86
+ fp16: false
87
+ freeze_language_model: false
88
+ freeze_mm_proj: false
89
+ freeze_vision_tower: true
90
+ gradient_accumulation_steps: 1
91
+ gradient_checkpointing: true
92
+ learning_rate: 3e-05
93
+ lr_scheduler_type: constant_with_warmup
94
+ lr_warmup_ratio: 0.03
95
+ per_device_eval_batch_size: 4
96
+ per_device_train_batch_size: 4
97
+ regularization: 0.001
98
+ seed: 42
99
+ weight_decay: 0
wandb/run-20241023_195332-5p9x2ymn/files/output.log ADDED
The diff for this file is too large to render. See raw diff
 
wandb/run-20241023_195332-5p9x2ymn/files/requirements.txt ADDED
@@ -0,0 +1,233 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ align-anything==0.0.1.dev0
2
+ PyYAML==6.0.2
3
+ frozenlist==1.4.1
4
+ contourpy==1.3.0
5
+ tokenizers==0.20.0
6
+ nvidia-cusolver-cu12==11.4.5.107
7
+ nvidia-ml-py==12.535.161
8
+ peft==0.13.1
9
+ opencv-python==4.6.0.66
10
+ tensorboard==2.18.0
11
+ typer==0.12.5
12
+ watchfiles==0.24.0
13
+ sentry-sdk==2.16.0
14
+ frechet-audio-distance==0.1.2
15
+ nvitop==1.3.2
16
+ virtualenv==20.26.6
17
+ nvidia-cuda-nvrtc-cu12==12.1.105
18
+ openai==1.51.2
19
+ gguf==0.10.0
20
+ resampy==0.4.3
21
+ typing_extensions==4.12.2
22
+ pandas==2.2.3
23
+ sympy==1.13.3
24
+ Werkzeug==3.0.4
25
+ jsonschema==4.23.0
26
+ httptools==0.6.1
27
+ compressed-tensors==0.6.0
28
+ httpcore==1.0.6
29
+ nvidia-cufft-cu12==11.0.2.54
30
+ semantic-version==2.10.0
31
+ fairscale==0.4.13
32
+ websockets==12.0
33
+ outlines==0.0.46
34
+ annotated-types==0.7.0
35
+ pyzmq==26.2.0
36
+ shellingham==1.5.4
37
+ starlette==0.38.6
38
+ gitdb==4.0.11
39
+ cfgv==3.4.0
40
+ gradio==4.44.1
41
+ matplotlib==3.9.2
42
+ librosa==0.10.2.post1
43
+ aiohttp==3.10.9
44
+ lazy_loader==0.4
45
+ torchvision==0.19.0
46
+ mdurl==0.1.2
47
+ safetensors==0.4.5
48
+ diffusers==0.30.3
49
+ Jinja2==3.1.4
50
+ nest-asyncio==1.6.0
51
+ imageio==2.35.1
52
+ setproctitle==1.3.3
53
+ markdown-it-py==3.0.0
54
+ uvloop==0.20.0
55
+ pluggy==1.5.0
56
+ nvidia-curand-cu12==10.3.2.106
57
+ distlib==0.3.8
58
+ mpmath==1.3.0
59
+ cachetools==5.5.0
60
+ nodeenv==1.9.1
61
+ referencing==0.35.1
62
+ prometheus_client==0.21.0
63
+ torchlibrosa==0.1.0
64
+ sniffio==1.3.1
65
+ pydub==0.25.1
66
+ nvidia-cusparse-cu12==12.1.0.106
67
+ imageio-ffmpeg==0.5.1
68
+ filelock==3.16.1
69
+ six==1.16.0
70
+ cycler==0.12.1
71
+ wheel==0.44.0
72
+ tiktoken==0.7.0
73
+ clint==0.5.1
74
+ wandb==0.18.5
75
+ Brotli==1.1.0
76
+ pyparsing==3.1.4
77
+ audioread==3.0.1
78
+ python-dotenv==1.0.1
79
+ tensorboard-data-server==0.7.2
80
+ image-reward==1.5
81
+ accelerate==1.0.0
82
+ threadpoolctl==3.5.0
83
+ tqdm==4.66.5
84
+ gradio_client==1.3.0
85
+ aiosignal==1.3.1
86
+ pytz==2024.2
87
+ bitsandbytes==0.44.1
88
+ distro==1.9.0
89
+ importlib_metadata==8.5.0
90
+ networkx==3.3
91
+ aiofiles==23.2.1
92
+ nvidia-cudnn-cu12==9.1.0.70
93
+ anyio==4.6.0
94
+ pydantic==2.9.2
95
+ pyairports==2.1.1
96
+ shortuuid==1.0.13
97
+ msgpack==1.1.0
98
+ einops==0.8.0
99
+ click==8.1.7
100
+ rich==13.9.2
101
+ jiter==0.6.1
102
+ cloudpickle==3.0.0
103
+ kiwisolver==1.4.7
104
+ tzdata==2024.2
105
+ opencv-python-headless==4.10.0.84
106
+ uvicorn==0.31.0
107
+ sentencepiece==0.2.0
108
+ soxr==0.5.0.post1
109
+ docker-pycreds==0.4.0
110
+ Markdown==3.7
111
+ nvidia-nvjitlink-cu12==12.6.77
112
+ multidict==6.1.0
113
+ pytorch-fid==0.3.0
114
+ h11==0.14.0
115
+ torchaudio==2.4.0
116
+ zipp==3.20.2
117
+ moviepy==1.0.3
118
+ grpcio==1.66.2
119
+ wcwidth==0.2.13
120
+ propcache==0.2.0
121
+ clip==0.2.0
122
+ tomlkit==0.12.0
123
+ ruff==0.6.9
124
+ aiohappyeyeballs==2.4.3
125
+ psutil==6.0.0
126
+ deepspeed==0.15.1
127
+ scikit-learn==1.5.2
128
+ certifi==2024.8.30
129
+ yarl==1.14.0
130
+ nvidia-nvtx-cu12==12.1.105
131
+ ffmpy==0.4.0
132
+ vllm==0.6.3.post1
133
+ optree==0.13.0
134
+ ftfy==6.2.3
135
+ importlib_resources==6.4.5
136
+ idna==3.10
137
+ absl-py==2.1.0
138
+ ray==2.37.0
139
+ pycryptodomex==3.21.0
140
+ nvidia-nccl-cu12==2.20.5
141
+ decorator==4.4.2
142
+ fsspec==2024.6.1
143
+ mutagen==1.47.0
144
+ partial-json-parser==0.2.1.1.post4
145
+ xxhash==3.5.0
146
+ scipy==1.14.1
147
+ pip==24.2
148
+ align-anything==0.0.1.dev0
149
+ yt-dlp==2024.8.6
150
+ diskcache==5.6.3
151
+ datasets==3.0.1
152
+ attrs==24.2.0
153
+ httpx==0.27.2
154
+ nvidia-cuda-runtime-cu12==12.1.105
155
+ webdataset==0.2.100
156
+ torch==2.4.0
157
+ pyarrow==17.0.0
158
+ numpy==1.26.4
159
+ python-multipart==0.0.12
160
+ pillow==10.4.0
161
+ msgspec==0.18.6
162
+ python-dateutil==2.9.0.post0
163
+ setuptools==75.1.0
164
+ orjson==3.10.7
165
+ fonttools==4.54.1
166
+ platformdirs==4.3.6
167
+ pycountry==24.6.1
168
+ lark==1.2.2
169
+ soundfile==0.12.1
170
+ smmap==5.0.1
171
+ prometheus-fastapi-instrumentator==7.0.0
172
+ xformers==0.0.27.post2
173
+ regex==2024.9.11
174
+ pycparser==2.22
175
+ cffi==1.17.1
176
+ mistral_common==1.4.4
177
+ fastapi==0.115.0
178
+ hpsv2==1.2.0
179
+ pooch==1.8.2
180
+ braceexpand==0.1.7
181
+ joblib==1.4.2
182
+ requests==2.32.3
183
+ pytest==7.2.0
184
+ identify==2.6.1
185
+ interegular==0.3.3
186
+ termcolor==2.5.0
187
+ args==0.1.0
188
+ Pygments==2.18.0
189
+ py-cpuinfo==9.0.0
190
+ nvidia-cublas-cu12==12.1.3.1
191
+ MarkupSafe==2.1.5
192
+ triton==3.0.0
193
+ jsonschema-specifications==2024.10.1
194
+ pydantic_core==2.23.4
195
+ huggingface-hub==0.25.1
196
+ transformers==4.46.0.dev0
197
+ hjson==3.1.0
198
+ urllib3==2.2.3
199
+ llvmlite==0.43.0
200
+ multiprocess==0.70.16
201
+ numba==0.60.0
202
+ some-package==0.1
203
+ dill==0.3.8
204
+ pre_commit==4.0.1
205
+ protobuf==3.20.3
206
+ GitPython==3.1.43
207
+ packaging==24.1
208
+ proglog==0.1.10
209
+ timm==0.6.13
210
+ lm-format-enforcer==0.10.6
211
+ iniconfig==2.0.0
212
+ ninja==1.11.1.1
213
+ pytest-split==0.8.0
214
+ nvidia-cuda-cupti-cu12==12.1.105
215
+ rpds-py==0.20.0
216
+ charset-normalizer==3.3.2
217
+ jaraco.functools==4.0.1
218
+ typing_extensions==4.12.2
219
+ importlib_resources==6.4.0
220
+ jaraco.text==3.12.1
221
+ importlib_metadata==8.0.0
222
+ zipp==3.19.2
223
+ autocommand==2.2.2
224
+ tomli==2.0.1
225
+ wheel==0.43.0
226
+ inflect==7.3.1
227
+ jaraco.collections==5.1.0
228
+ jaraco.context==5.3.0
229
+ typeguard==4.3.0
230
+ platformdirs==4.2.2
231
+ backports.tarfile==1.2.0
232
+ more-itertools==10.3.0
233
+ packaging==24.1
wandb/run-20241023_195332-5p9x2ymn/files/wandb-metadata.json ADDED
@@ -0,0 +1,106 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "os": "Linux-5.4.0-196-generic-x86_64-with-glibc2.31",
3
+ "python": "3.11.10",
4
+ "startedAt": "2024-10-23T19:53:32.027977Z",
5
+ "args": [
6
+ "--local_rank=0",
7
+ "--model_name_or_path",
8
+ "/data/models/llava/llava-1.5-13b-hf",
9
+ "--train_datasets",
10
+ "/data/align-anything/jiayi/ti2t/refine_gen_wo_res/1021_13b_2000",
11
+ "--train_template",
12
+ "AA_TI2T_Critique",
13
+ "--train_split",
14
+ "train",
15
+ "--eval_datasets",
16
+ "/home/align-anything/datasets/40k_ti2t_filtered",
17
+ "--eval_template",
18
+ "AA_TI2T",
19
+ "--eval_split",
20
+ "train",
21
+ "--output_dir",
22
+ "/data/align-anything/jiayi/ti2t/rm_10_22_ours_13b_2000",
23
+ "--save_interval",
24
+ "598",
25
+ "--epochs",
26
+ "5"
27
+ ],
28
+ "program": "-m align_anything.trainers.text_image_to_text.rm",
29
+ "git": {
30
+ "remote": "https://github.com/Gaiejj/align-anything.git",
31
+ "commit": "95ea3305a3d37850670c72e0af8e5a16cfb8177b"
32
+ },
33
+ "email": "524339208@qq.com",
34
+ "root": "/data/align-anything/jiayi/ti2t/rm_10_22_ours_13b_2000",
35
+ "host": "lyg0194",
36
+ "username": "align-anything",
37
+ "executable": "/home/align-anything/miniconda3/envs/jy-align/bin/python",
38
+ "cpu_count": 64,
39
+ "cpu_count_logical": 128,
40
+ "gpu": "NVIDIA A100-SXM4-80GB",
41
+ "gpu_count": 8,
42
+ "disk": {
43
+ "/": {
44
+ "total": "939477946368",
45
+ "used": "771994755072"
46
+ }
47
+ },
48
+ "memory": {
49
+ "total": "1081823907840"
50
+ },
51
+ "cpu": {
52
+ "count": 64,
53
+ "countLogical": 128
54
+ },
55
+ "gpu_nvidia": [
56
+ {
57
+ "name": "NVIDIA A100-SXM4-80GB",
58
+ "memoryTotal": "85899345920",
59
+ "cudaCores": 6912,
60
+ "architecture": "Ampere"
61
+ },
62
+ {
63
+ "name": "NVIDIA A100-SXM4-80GB",
64
+ "memoryTotal": "85899345920",
65
+ "cudaCores": 6912,
66
+ "architecture": "Ampere"
67
+ },
68
+ {
69
+ "name": "NVIDIA A100-SXM4-80GB",
70
+ "memoryTotal": "85899345920",
71
+ "cudaCores": 6912,
72
+ "architecture": "Ampere"
73
+ },
74
+ {
75
+ "name": "NVIDIA A100-SXM4-80GB",
76
+ "memoryTotal": "85899345920",
77
+ "cudaCores": 6912,
78
+ "architecture": "Ampere"
79
+ },
80
+ {
81
+ "name": "NVIDIA A100-SXM4-80GB",
82
+ "memoryTotal": "85899345920",
83
+ "cudaCores": 6912,
84
+ "architecture": "Ampere"
85
+ },
86
+ {
87
+ "name": "NVIDIA A100-SXM4-80GB",
88
+ "memoryTotal": "85899345920",
89
+ "cudaCores": 6912,
90
+ "architecture": "Ampere"
91
+ },
92
+ {
93
+ "name": "NVIDIA A100-SXM4-80GB",
94
+ "memoryTotal": "85899345920",
95
+ "cudaCores": 6912,
96
+ "architecture": "Ampere"
97
+ },
98
+ {
99
+ "name": "NVIDIA A100-SXM4-80GB",
100
+ "memoryTotal": "85899345920",
101
+ "cudaCores": 6912,
102
+ "architecture": "Ampere"
103
+ }
104
+ ],
105
+ "cudaVersion": "12.4"
106
+ }
wandb/run-20241023_195332-5p9x2ymn/files/wandb-summary.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"_timestamp":1.7297525127125318e+09,"train/loss":0.02179259993135929,"train/step":5980,"eval/accuracy":0.670096218585968,"train/accuracy":1,"eval/step":5980,"eval/reward_mean":6.753208637237549,"_step":5980,"train/lr":3e-05,"train/epoch":5,"_runtime":39413.899368224,"eval/reward_std":3.374933958053589,"_wandb":{"runtime":39413}}
wandb/run-20241023_195332-5p9x2ymn/logs/debug-internal.log ADDED
@@ -0,0 +1,25 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"time":"2024-10-23T19:53:32.034282892Z","level":"INFO","msg":"using version","core version":"0.18.5"}
2
+ {"time":"2024-10-23T19:53:32.034313596Z","level":"INFO","msg":"created symlink","path":"/data/align-anything/jiayi/ti2t/rm_10_22_ours_13b_2000/wandb/run-20241023_195332-5p9x2ymn/logs/debug-core.log"}
3
+ {"time":"2024-10-23T19:53:32.257077888Z","level":"INFO","msg":"created new stream","id":"5p9x2ymn"}
4
+ {"time":"2024-10-23T19:53:32.25716001Z","level":"INFO","msg":"stream: started","id":"5p9x2ymn"}
5
+ {"time":"2024-10-23T19:53:32.257194334Z","level":"INFO","msg":"sender: started","stream_id":"5p9x2ymn"}
6
+ {"time":"2024-10-23T19:53:32.257175304Z","level":"INFO","msg":"handler: started","stream_id":{"value":"5p9x2ymn"}}
7
+ {"time":"2024-10-23T19:53:32.257226079Z","level":"INFO","msg":"writer: Do: started","stream_id":{"value":"5p9x2ymn"}}
8
+ {"time":"2024-10-23T19:53:33.030824275Z","level":"INFO","msg":"Starting system monitor"}
9
+ {"time":"2024-10-23T23:33:34.192965196Z","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/524339208/align-anything/5p9x2ymn/file_stream"}
10
+ {"time":"2024-10-24T00:17:33.02116761Z","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": context deadline exceeded"}
11
+ {"time":"2024-10-24T00:17:38.542096425Z","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/524339208/align-anything/5p9x2ymn/file_stream"}
12
+ {"time":"2024-10-24T00:33:58.505798828Z","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/524339208/align-anything/5p9x2ymn/file_stream"}
13
+ {"time":"2024-10-24T03:15:33.036197732Z","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/524339208/align-anything/5p9x2ymn/file_stream\": EOF"}
14
+ {"time":"2024-10-24T03:15:33.036293074Z","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": unexpected EOF"}
15
+ {"time":"2024-10-24T06:50:25.927379401Z","level":"INFO","msg":"Stopping system monitor"}
16
+ {"time":"2024-10-24T06:50:25.928726748Z","level":"INFO","msg":"Stopped system monitor"}
17
+ {"time":"2024-10-24T06:50:26.45386731Z","level":"WARN","msg":"No program path found, not creating job artifact. See https://docs.wandb.ai/guides/launch/create-job"}
18
+ {"time":"2024-10-24T06:50:26.453900793Z","level":"INFO","msg":"sender: sendDefer: no job artifact to save"}
19
+ {"time":"2024-10-24T06:50:26.928252456Z","level":"INFO","msg":"handler: operation stats","stats":{"operations":[{"desc":"uploading wandb-summary.json","runtime_seconds":0.450821229,"progress":"331B/331B"},{"desc":"uploading config.yaml","runtime_seconds":0.185946124,"progress":"2.5KB/2.5KB"},{"desc":"uploading output.log","runtime_seconds":0.185925636,"progress":"64.0KB/291.8KB"}],"total_operations":3}}
20
+ {"time":"2024-10-24T06:50:27.530089799Z","level":"INFO","msg":"fileTransfer: Close: file transfer manager closed"}
21
+ {"time":"2024-10-24T06:50:29.024633815Z","level":"INFO","msg":"stream: closing","id":"5p9x2ymn"}
22
+ {"time":"2024-10-24T06:50:29.024666435Z","level":"INFO","msg":"handler: closed","stream_id":{"value":"5p9x2ymn"}}
23
+ {"time":"2024-10-24T06:50:29.024712782Z","level":"INFO","msg":"sender: closed","stream_id":"5p9x2ymn"}
24
+ {"time":"2024-10-24T06:50:29.024699477Z","level":"INFO","msg":"writer: Close: closed","stream_id":{"value":"5p9x2ymn"}}
25
+ {"time":"2024-10-24T06:50:29.025524254Z","level":"INFO","msg":"stream: closed","id":"5p9x2ymn"}
wandb/run-20241023_195332-5p9x2ymn/logs/debug.log ADDED
@@ -0,0 +1,33 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2024-10-23 19:53:32,022 INFO MainThread:3156467 [wandb_setup.py:_flush():79] Current SDK version is 0.18.5
2
+ 2024-10-23 19:53:32,022 INFO MainThread:3156467 [wandb_setup.py:_flush():79] Configure stats pid to 3156467
3
+ 2024-10-23 19:53:32,022 INFO MainThread:3156467 [wandb_setup.py:_flush():79] Loading settings from /home/align-anything/.config/wandb/settings
4
+ 2024-10-23 19:53:32,022 INFO MainThread:3156467 [wandb_setup.py:_flush():79] Loading settings from /home/align-anything/align-anything/local_scripts/wandb/settings
5
+ 2024-10-23 19:53:32,022 INFO MainThread:3156467 [wandb_setup.py:_flush():79] Loading settings from environment variables: {'api_key': '***REDACTED***'}
6
+ 2024-10-23 19:53:32,022 INFO MainThread:3156467 [wandb_setup.py:_flush():79] Applying setup settings: {'mode': None, '_disable_service': None}
7
+ 2024-10-23 19:53:32,022 WARNING MainThread:3156467 [wandb_setup.py:_flush():79] Could not find program at -m align_anything.trainers.text_image_to_text.rm
8
+ 2024-10-23 19:53:32,022 INFO MainThread:3156467 [wandb_setup.py:_flush():79] Inferring run settings from compute environment: {'program_relpath': None, 'program': '-m align_anything.trainers.text_image_to_text.rm'}
9
+ 2024-10-23 19:53:32,022 INFO MainThread:3156467 [wandb_setup.py:_flush():79] Applying login settings: {}
10
+ 2024-10-23 19:53:32,023 INFO MainThread:3156467 [wandb_init.py:_log_setup():534] Logging user logs to /data/align-anything/jiayi/ti2t/rm_10_22_ours_13b_2000/wandb/run-20241023_195332-5p9x2ymn/logs/debug.log
11
+ 2024-10-23 19:53:32,023 INFO MainThread:3156467 [wandb_init.py:_log_setup():535] Logging internal logs to /data/align-anything/jiayi/ti2t/rm_10_22_ours_13b_2000/wandb/run-20241023_195332-5p9x2ymn/logs/debug-internal.log
12
+ 2024-10-23 19:53:32,023 INFO MainThread:3156467 [wandb_init.py:init():621] calling init triggers
13
+ 2024-10-23 19:53:32,023 INFO MainThread:3156467 [wandb_init.py:init():628] wandb.init called with sweep_config: {}
14
+ config: {'train_cfgs': {'ds_cfgs': 'ds_z3_config.json', 'epochs': 5.0, 'seed': 42, 'per_device_train_batch_size': 4, 'per_device_eval_batch_size': 4, 'gradient_accumulation_steps': 1, 'gradient_checkpointing': True, 'learning_rate': 3e-05, 'lr_scheduler_type': 'constant_with_warmup', 'lr_warmup_ratio': 0.03, 'weight_decay': 0.0, 'adam_betas': [0.9, 0.95], 'bf16': True, 'fp16': False, 'eval_strategy': 'epoch', 'eval_interval': 10, 'regularization': 0.001, 'freeze_mm_proj': False, 'freeze_vision_tower': True, 'freeze_language_model': False}, 'data_cfgs': {'train_datasets': '/data/align-anything/jiayi/ti2t/refine_gen_wo_res/1021_13b_2000', 'train_template': 'AA_TI2T_Critique', 'train_name': None, 'train_size': None, 'train_split': 'train', 'train_subset': None, 'train_data_files': None, 'train_optional_args': [], 'eval_datasets': '/home/align-anything/datasets/40k_ti2t_filtered', 'eval_template': 'AA_TI2T', 'eval_name': None, 'eval_size': None, 'eval_split': 'train', 'eval_subset': None, 'eval_data_files': None, 'eval_optional_args': []}, 'logger_cfgs': {'log_type': 'wandb', 'log_project': 'align-anything', 'log_run_name': 'rm', 'output_dir': '/data/align-anything/jiayi/ti2t/rm_10_22_ours_13b_2000', 'cache_dir': None, 'save_interval': 598.0}, 'model_cfgs': {'model_name_or_path': '/data/models/llava/llava-1.5-13b-hf', 'trust_remote_code': True, 'model_max_length': 2048}, 'special_tokens': None}
15
+ 2024-10-23 19:53:32,023 INFO MainThread:3156467 [wandb_init.py:init():671] starting backend
16
+ 2024-10-23 19:53:32,023 INFO MainThread:3156467 [wandb_init.py:init():675] sending inform_init request
17
+ 2024-10-23 19:53:32,027 INFO MainThread:3156467 [backend.py:_multiprocessing_setup():104] multiprocessing start_methods=fork,spawn,forkserver, using: spawn
18
+ 2024-10-23 19:53:32,027 INFO MainThread:3156467 [wandb_init.py:init():688] backend started and connected
19
+ 2024-10-23 19:53:32,030 INFO MainThread:3156467 [wandb_init.py:init():783] updated telemetry
20
+ 2024-10-23 19:53:32,036 INFO MainThread:3156467 [wandb_init.py:init():816] communicating run to backend with 90.0 second timeout
21
+ 2024-10-23 19:53:33,024 INFO MainThread:3156467 [wandb_init.py:init():867] starting run threads in backend
22
+ 2024-10-23 19:53:33,160 INFO MainThread:3156467 [wandb_run.py:_console_start():2463] atexit reg
23
+ 2024-10-23 19:53:33,160 INFO MainThread:3156467 [wandb_run.py:_redirect():2311] redirect: wrap_raw
24
+ 2024-10-23 19:53:33,160 INFO MainThread:3156467 [wandb_run.py:_redirect():2376] Wrapping output streams.
25
+ 2024-10-23 19:53:33,160 INFO MainThread:3156467 [wandb_run.py:_redirect():2401] Redirects installed.
26
+ 2024-10-23 19:53:33,164 INFO MainThread:3156467 [wandb_init.py:init():911] run started, returning control to user process
27
+ 2024-10-24 06:50:25,922 INFO MainThread:3156467 [wandb_run.py:_finish():2158] finishing run 524339208/align-anything/5p9x2ymn
28
+ 2024-10-24 06:50:25,925 INFO MainThread:3156467 [wandb_run.py:_atexit_cleanup():2426] got exitcode: 0
29
+ 2024-10-24 06:50:25,926 INFO MainThread:3156467 [wandb_run.py:_restore():2408] restore
30
+ 2024-10-24 06:50:25,926 INFO MainThread:3156467 [wandb_run.py:_restore():2414] restore done
31
+ 2024-10-24 06:50:29,011 INFO MainThread:3156467 [wandb_run.py:_footer_history_summary_info():3975] rendering history
32
+ 2024-10-24 06:50:29,013 INFO MainThread:3156467 [wandb_run.py:_footer_history_summary_info():4007] rendering summary
33
+ 2024-10-24 06:50:29,023 INFO MainThread:3156467 [wandb_run.py:_footer_sync_info():3934] logging synced files
wandb/run-20241023_195332-5p9x2ymn/run-5p9x2ymn.wandb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ef8765b2bc94497d75df8cfc1c02fc8619a3814ba00264199d8e8797d5cde3a
3
+ size 46445978