htlou commited on
Commit
ae1b277
1 Parent(s): f19e1e5

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +1 -0
  2. added_tokens.json +16 -0
  3. arguments.yaml +51 -0
  4. chat_template.json +3 -0
  5. config.json +48 -0
  6. environ.txt +178 -0
  7. merges.txt +0 -0
  8. preprocessor_config.json +29 -0
  9. pytorch_model.bin +3 -0
  10. script.sh +74 -0
  11. special_tokens_map.json +45 -0
  12. tokenizer.json +0 -0
  13. tokenizer_config.json +160 -0
  14. vocab.json +0 -0
  15. wandb/debug-internal.log +0 -0
  16. wandb/debug.log +29 -0
  17. wandb/run-20240921_050939-9z0w7l09/files/conda-environment.yaml +516 -0
  18. wandb/run-20240921_050939-9z0w7l09/files/config.yaml +112 -0
  19. wandb/run-20240921_050939-9z0w7l09/files/output.log +206 -0
  20. wandb/run-20240921_050939-9z0w7l09/files/requirements.txt +325 -0
  21. wandb/run-20240921_050939-9z0w7l09/files/wandb-metadata.json +1215 -0
  22. wandb/run-20240921_050939-9z0w7l09/files/wandb-summary.json +1 -0
  23. wandb/run-20240921_050939-9z0w7l09/logs/debug-internal.log +0 -0
  24. wandb/run-20240921_050939-9z0w7l09/logs/debug.log +36 -0
  25. wandb/run-20240921_050939-9z0w7l09/run-9z0w7l09.wandb +0 -0
  26. wandb/run-20240921_103042-1p62y7m7/files/conda-environment.yaml +516 -0
  27. wandb/run-20240921_103042-1p62y7m7/files/config.yaml +111 -0
  28. wandb/run-20240921_103042-1p62y7m7/files/output.log +193 -0
  29. wandb/run-20240921_103042-1p62y7m7/files/requirements.txt +325 -0
  30. wandb/run-20240921_103042-1p62y7m7/files/wandb-metadata.json +1215 -0
  31. wandb/run-20240921_103042-1p62y7m7/files/wandb-summary.json +1 -0
  32. wandb/run-20240921_103042-1p62y7m7/logs/debug-internal.log +0 -0
  33. wandb/run-20240921_103042-1p62y7m7/logs/debug.log +29 -0
  34. wandb/run-20240921_103042-1p62y7m7/run-1p62y7m7.wandb +0 -0
  35. wandb/run-20240921_111222-4ony16ec/files/conda-environment.yaml +516 -0
  36. wandb/run-20240921_111222-4ony16ec/files/config.yaml +112 -0
  37. wandb/run-20240921_111222-4ony16ec/files/output.log +609 -0
  38. wandb/run-20240921_111222-4ony16ec/files/requirements.txt +325 -0
  39. wandb/run-20240921_111222-4ony16ec/files/wandb-metadata.json +1215 -0
  40. wandb/run-20240921_111222-4ony16ec/files/wandb-summary.json +1 -0
  41. wandb/run-20240921_111222-4ony16ec/logs/debug-internal.log +0 -0
  42. wandb/run-20240921_111222-4ony16ec/logs/debug.log +36 -0
  43. wandb/run-20240921_111222-4ony16ec/run-4ony16ec.wandb +3 -0
  44. wandb/run-20240921_115259-p9bvnzls/files/conda-environment.yaml +516 -0
  45. wandb/run-20240921_115259-p9bvnzls/files/config.yaml +111 -0
  46. wandb/run-20240921_115259-p9bvnzls/files/output.log +190 -0
  47. wandb/run-20240921_115259-p9bvnzls/files/requirements.txt +325 -0
  48. wandb/run-20240921_115259-p9bvnzls/files/wandb-metadata.json +1215 -0
  49. wandb/run-20240921_115259-p9bvnzls/files/wandb-summary.json +1 -0
  50. wandb/run-20240921_115259-p9bvnzls/logs/debug-internal.log +0 -0
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ wandb/run-20240921_111222-4ony16ec/run-4ony16ec.wandb filter=lfs diff=lfs merge=lfs -text
added_tokens.json ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "<|box_end|>": 151649,
3
+ "<|box_start|>": 151648,
4
+ "<|endoftext|>": 151643,
5
+ "<|im_end|>": 151645,
6
+ "<|im_start|>": 151644,
7
+ "<|image_pad|>": 151655,
8
+ "<|object_ref_end|>": 151647,
9
+ "<|object_ref_start|>": 151646,
10
+ "<|quad_end|>": 151651,
11
+ "<|quad_start|>": 151650,
12
+ "<|video_pad|>": 151656,
13
+ "<|vision_end|>": 151653,
14
+ "<|vision_pad|>": 151654,
15
+ "<|vision_start|>": 151652
16
+ }
arguments.yaml ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ data_cfgs:
2
+ eval_data_files: null
3
+ eval_datasets: null
4
+ eval_optional_args: []
5
+ eval_size: null
6
+ eval_split: null
7
+ eval_subset: null
8
+ eval_template: null
9
+ train_data_files: extracted_preference_1.5k_washed.json
10
+ train_datasets: /aifs4su/yaodong/datasets/aaa_dataset/TV2T-preference/extracted
11
+ train_optional_args: []
12
+ train_size: null
13
+ train_split: train
14
+ train_subset: null
15
+ train_template: NExTQA_preference
16
+ logger_cfgs:
17
+ cache_dir: null
18
+ log_project: align-anything
19
+ log_run_name: dpo
20
+ log_type: wandb
21
+ output_dir: ../outputs/dpo_tiv2t_1.5k_base
22
+ save_interval: 100000
23
+ model_cfgs:
24
+ model_max_length: 4096
25
+ model_name_or_path: /aifs4su/yaodong/models/Qwen2-VL-7B-Instruct
26
+ trust_remote_code: true
27
+ special_tokens: null
28
+ train_cfgs:
29
+ adam_betas:
30
+ - 0.9
31
+ - 0.95
32
+ bf16: true
33
+ ds_cfgs: ds_z3_config.json
34
+ epochs: 3
35
+ eval_interval: 10
36
+ eval_strategy: epoch
37
+ fp16: false
38
+ freeze_language_model: false
39
+ freeze_mm_proj: false
40
+ freeze_vision_tower: true
41
+ gradient_accumulation_steps: 1.0
42
+ gradient_checkpointing: true
43
+ learning_rate: 1.0e-06
44
+ lr_scheduler_type: cosine
45
+ lr_warmup_ratio: 0.01
46
+ per_device_eval_batch_size: 1.0
47
+ per_device_train_batch_size: 1.0
48
+ regularization: 0.001
49
+ scale_coeff: 0.1
50
+ seed: 42
51
+ weight_decay: 0.0
chat_template.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ {
2
+ "chat_template": "{% set image_count = namespace(value=0) %}{% set video_count = namespace(value=0) %}{% for message in messages %}{% if loop.first and message['role'] != 'system' %}<|im_start|>system\nYou are a helpful assistant.<|im_end|>\n{% endif %}<|im_start|>{{ message['role'] }}\n{% if message['content'] is string %}{{ message['content'] }}<|im_end|>\n{% else %}{% for content in message['content'] %}{% if content['type'] == 'image' or 'image' in content or 'image_url' in content %}{% set image_count.value = image_count.value + 1 %}{% if add_vision_id %}Picture {{ image_count.value }}: {% endif %}<|vision_start|><|image_pad|><|vision_end|>{% elif content['type'] == 'video' or 'video' in content %}{% set video_count.value = video_count.value + 1 %}{% if add_vision_id %}Video {{ video_count.value }}: {% endif %}<|vision_start|><|video_pad|><|vision_end|>{% elif 'text' in content %}{{ content['text'] }}{% endif %}{% endfor %}<|im_end|>\n{% endif %}{% endfor %}{% if add_generation_prompt %}<|im_start|>assistant\n{% endif %}"
3
+ }
config.json ADDED
@@ -0,0 +1,48 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "/aifs4su/yaodong/models/Qwen2-VL-7B-Instruct",
3
+ "architectures": [
4
+ "Qwen2VLForConditionalGeneration"
5
+ ],
6
+ "attention_dropout": 0.0,
7
+ "bos_token_id": 128245,
8
+ "eos_token_id": 151645,
9
+ "hidden_act": "silu",
10
+ "hidden_size": 3584,
11
+ "image_token_id": 151655,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 18944,
14
+ "max_position_embeddings": 32768,
15
+ "max_window_layers": 28,
16
+ "model_type": "qwen2_vl",
17
+ "num_attention_heads": 28,
18
+ "num_hidden_layers": 28,
19
+ "num_key_value_heads": 4,
20
+ "pad_token_id": 151643,
21
+ "rms_norm_eps": 1e-06,
22
+ "rope_scaling": {
23
+ "mrope_section": [
24
+ 16,
25
+ 24,
26
+ 24
27
+ ],
28
+ "rope_type": "default",
29
+ "type": "default"
30
+ },
31
+ "rope_theta": 1000000.0,
32
+ "sliding_window": 32768,
33
+ "tie_word_embeddings": false,
34
+ "torch_dtype": "bfloat16",
35
+ "transformers_version": "4.45.0.dev0",
36
+ "use_cache": true,
37
+ "use_sliding_window": false,
38
+ "video_token_id": 151656,
39
+ "vision_config": {
40
+ "in_chans": 3,
41
+ "model_type": "qwen2_vl",
42
+ "spatial_patch_size": 14
43
+ },
44
+ "vision_end_token_id": 151653,
45
+ "vision_start_token_id": 151652,
46
+ "vision_token_id": 151654,
47
+ "vocab_size": 151657
48
+ }
environ.txt ADDED
@@ -0,0 +1,178 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ BASH_FUNC__module_raw%%=() { unset _mlshdbg;
2
+ if [ "${MODULES_SILENT_SHELL_DEBUG:-0}" = '1' ]; then
3
+ case "$-" in
4
+ *v*x*)
5
+ set +vx;
6
+ _mlshdbg='vx'
7
+ ;;
8
+ *v*)
9
+ set +v;
10
+ _mlshdbg='v'
11
+ ;;
12
+ *x*)
13
+ set +x;
14
+ _mlshdbg='x'
15
+ ;;
16
+ *)
17
+ _mlshdbg=''
18
+ ;;
19
+ esac;
20
+ fi;
21
+ unset _mlre _mlIFS;
22
+ if [ -n "${IFS+x}" ]; then
23
+ _mlIFS=$IFS;
24
+ fi;
25
+ IFS=' ';
26
+ for _mlv in ${MODULES_RUN_QUARANTINE:-};
27
+ do
28
+ if [ "${_mlv}" = "${_mlv##*[!A-Za-z0-9_]}" -a "${_mlv}" = "${_mlv#[0-9]}" ]; then
29
+ if [ -n "`eval 'echo ${'$_mlv'+x}'`" ]; then
30
+ _mlre="${_mlre:-}${_mlv}_modquar='`eval 'echo ${'$_mlv'}'`' ";
31
+ fi;
32
+ _mlrv="MODULES_RUNENV_${_mlv}";
33
+ _mlre="${_mlre:-}${_mlv}='`eval 'echo ${'$_mlrv':-}'`' ";
34
+ fi;
35
+ done;
36
+ if [ -n "${_mlre:-}" ]; then
37
+ eval `eval ${_mlre} /usr/bin/tclsh /cm/local/apps/environment-modules/4.5.3/libexec/modulecmd.tcl bash '"$@"'`;
38
+ else
39
+ eval `/usr/bin/tclsh /cm/local/apps/environment-modules/4.5.3/libexec/modulecmd.tcl bash "$@"`;
40
+ fi;
41
+ _mlstatus=$?;
42
+ if [ -n "${_mlIFS+x}" ]; then
43
+ IFS=$_mlIFS;
44
+ else
45
+ unset IFS;
46
+ fi;
47
+ unset _mlre _mlv _mlrv _mlIFS;
48
+ if [ -n "${_mlshdbg:-}" ]; then
49
+ set -$_mlshdbg;
50
+ fi;
51
+ unset _mlshdbg;
52
+ return $_mlstatus
53
+ }
54
+ BASH_FUNC_ml%%=() { module ml "$@"
55
+ }
56
+ BASH_FUNC_module%%=() { _module_raw "$@" 2>&1
57
+ }
58
+ BASH_FUNC_switchml%%=() { typeset swfound=1;
59
+ if [ "${MODULES_USE_COMPAT_VERSION:-0}" = '1' ]; then
60
+ typeset swname='main';
61
+ if [ -e /cm/local/apps/environment-modules/4.5.3/libexec/modulecmd.tcl ]; then
62
+ typeset swfound=0;
63
+ unset MODULES_USE_COMPAT_VERSION;
64
+ fi;
65
+ else
66
+ typeset swname='compatibility';
67
+ if [ -e /cm/local/apps/environment-modules/4.5.3/libexec/modulecmd-compat ]; then
68
+ typeset swfound=0;
69
+ MODULES_USE_COMPAT_VERSION=1;
70
+ export MODULES_USE_COMPAT_VERSION;
71
+ fi;
72
+ fi;
73
+ if [ $swfound -eq 0 ]; then
74
+ echo "Switching to Modules $swname version";
75
+ source /cm/local/apps/environment-modules/4.5.3/init/bash;
76
+ else
77
+ echo "Cannot switch to Modules $swname version, command not found";
78
+ return 1;
79
+ fi
80
+ }
81
+ BROWSER=/home/yangyaodong/.vscode-server/cli/servers/Stable-38c31bc77e0dd6ae88a4e9cc93428cc27a56ba40/server/bin/helpers/browser.sh
82
+ CMD_WLM_CLUSTER_NAME=slurm
83
+ COLORTERM=truecolor
84
+ CONDA_DEFAULT_ENV=hantao_tiv
85
+ CONDA_EXE=/aifs4su/yaodong/miniconda3/bin/conda
86
+ CONDA_MKL_INTERFACE_LAYER_BACKUP=
87
+ CONDA_PREFIX=/aifs4su/yaodong/miniconda3/envs/hantao_tiv
88
+ CONDA_PREFIX_1=/aifs4su/yaodong/miniconda3
89
+ CONDA_PREFIX_2=/aifs4su/yaodong/miniconda3/envs/hantao_new
90
+ CONDA_PROMPT_MODIFIER=(hantao_tiv)
91
+ CONDA_PYTHON_EXE=/aifs4su/yaodong/miniconda3/bin/python
92
+ CONDA_SHLVL=3
93
+ CPATH=/cm/shared/apps/slurm/current/include
94
+ CPATH_modshare=/cm/shared/apps/slurm/current/include:1
95
+ CROSS_RANK=0
96
+ CROSS_SIZE=1
97
+ CUDA_HOME=/aifs4su/yaodong/miniconda3/envs/hantao_tiv
98
+ CUDA_MODULE_LOADING=LAZY
99
+ CUDA_VISIBLE_DEVICES=0,1,2,3,4,5,6,7
100
+ DBUS_SESSION_BUS_ADDRESS=unix:path=/run/user/1028/bus
101
+ ENABLE_LMOD=0
102
+ GIT_ASKPASS=/home/yangyaodong/.vscode-server/cli/servers/Stable-38c31bc77e0dd6ae88a4e9cc93428cc27a56ba40/server/extensions/git/dist/askpass.sh
103
+ GSETTINGS_SCHEMA_DIR=/aifs4su/yaodong/miniconda3/envs/hantao_tiv/share/glib-2.0/schemas
104
+ GSETTINGS_SCHEMA_DIR_CONDA_BACKUP=
105
+ HOME=/home/yangyaodong
106
+ KMP_DUPLICATE_LIB_OK=True
107
+ KMP_INIT_AT_FORK=FALSE
108
+ LANG=C.UTF-8
109
+ LD_LIBRARY_PATH=/usr/local/cuda/lib64:/usr/mpi/gcc/openmpi-4.1.7a1/lib:/usr/local/cuda/lib64:/usr/local/cuda/lib64:/cm/shared/apps/slurm/current/lib64/slurm:/cm/shared/apps/slurm/current/lib64
110
+ LD_LIBRARY_PATH_modshare=/cm/shared/apps/slurm/current/lib64:1:/usr/mpi/gcc/openmpi-4.1.7a1/lib:1:/cm/shared/apps/slurm/current/lib64/slurm:1:/usr/local/cuda/lib64:1
111
+ LD_RUN_PATH=/usr/mpi/gcc/openmpi-4.1.7a1/lib
112
+ LD_RUN_PATH_modshare=/usr/mpi/gcc/openmpi-4.1.7a1/lib:1
113
+ LESSCLOSE=/usr/bin/lesspipe %s %s
114
+ LESSOPEN=| /usr/bin/lesspipe %s
115
+ LIBRARY_PATH=/cm/shared/apps/slurm/current/lib64/slurm:/cm/shared/apps/slurm/current/lib64
116
+ LIBRARY_PATH_modshare=/cm/shared/apps/slurm/current/lib64:1:/cm/shared/apps/slurm/current/lib64/slurm:1
117
+ LOADEDMODULES=slurm/slurm/23.02.6:gcc/64/4.1.7a1
118
+ LOADEDMODULES_modshare=slurm/slurm/23.02.6:1:gcc/64/4.1.7a1:1
119
+ LOCAL_RANK=0
120
+ LOCAL_SIZE=8
121
+ LOGLEVEL=WARNING
122
+ LOGNAME=yangyaodong
123
+ LS_COLORS=rs=0:di=01;34:ln=01;36:mh=00:pi=40;33:so=01;35:do=01;35:bd=40;33;01:cd=40;33;01:or=40;31;01:mi=00:su=37;41:sg=30;43:ca=30;41:tw=30;42:ow=34;42:st=37;44:ex=01;32:*.tar=01;31:*.tgz=01;31:*.arc=01;31:*.arj=01;31:*.taz=01;31:*.lha=01;31:*.lz4=01;31:*.lzh=01;31:*.lzma=01;31:*.tlz=01;31:*.txz=01;31:*.tzo=01;31:*.t7z=01;31:*.zip=01;31:*.z=01;31:*.dz=01;31:*.gz=01;31:*.lrz=01;31:*.lz=01;31:*.lzo=01;31:*.xz=01;31:*.zst=01;31:*.tzst=01;31:*.bz2=01;31:*.bz=01;31:*.tbz=01;31:*.tbz2=01;31:*.tz=01;31:*.deb=01;31:*.rpm=01;31:*.jar=01;31:*.war=01;31:*.ear=01;31:*.sar=01;31:*.rar=01;31:*.alz=01;31:*.ace=01;31:*.zoo=01;31:*.cpio=01;31:*.7z=01;31:*.rz=01;31:*.cab=01;31:*.wim=01;31:*.swm=01;31:*.dwm=01;31:*.esd=01;31:*.jpg=01;35:*.jpeg=01;35:*.mjpg=01;35:*.mjpeg=01;35:*.gif=01;35:*.bmp=01;35:*.pbm=01;35:*.pgm=01;35:*.ppm=01;35:*.tga=01;35:*.xbm=01;35:*.xpm=01;35:*.tif=01;35:*.tiff=01;35:*.png=01;35:*.svg=01;35:*.svgz=01;35:*.mng=01;35:*.pcx=01;35:*.mov=01;35:*.mpg=01;35:*.mpeg=01;35:*.m2v=01;35:*.mkv=01;35:*.webm=01;35:*.webp=01;35:*.ogm=01;35:*.mp4=01;35:*.m4v=01;35:*.mp4v=01;35:*.vob=01;35:*.qt=01;35:*.nuv=01;35:*.wmv=01;35:*.asf=01;35:*.rm=01;35:*.rmvb=01;35:*.flc=01;35:*.avi=01;35:*.fli=01;35:*.flv=01;35:*.gl=01;35:*.dl=01;35:*.xcf=01;35:*.xwd=01;35:*.yuv=01;35:*.cgm=01;35:*.emf=01;35:*.ogv=01;35:*.ogx=01;35:*.aac=00;36:*.au=00;36:*.flac=00;36:*.m4a=00;36:*.mid=00;36:*.midi=00;36:*.mka=00;36:*.mp3=00;36:*.mpc=00;36:*.ogg=00;36:*.ra=00;36:*.wav=00;36:*.oga=00;36:*.opus=00;36:*.spx=00;36:*.xspf=00;36:
124
+ MANPATH=/usr/mpi/gcc/openmpi-4.1.7a1/share/man:/cm/shared/apps/slurm/current/man:/cm/local/apps/environment-modules/4.5.3/share/man:/usr/local/man:/usr/local/share/man:/usr/share/man:/cm/local/apps/environment-modules/current/share/man:/cm/local/apps/environment-modules/current/share/man:/cm/local/apps/environment-modules/current/share/man
125
+ MANPATH_modshare=/usr/local/share/man:1:/usr/mpi/gcc/openmpi-4.1.7a1/share/man:1:/cm/local/apps/environment-modules/current/share/man:1:/cm/local/apps/environment-modules/4.5.3/share/man:1:/usr/local/man:1:/usr/share/man:1:/cm/shared/apps/slurm/current/man:1
126
+ MASTER_ADDR=127.0.0.1
127
+ MASTER_PORT=16688
128
+ MIG_PARTED_CHECKPOINT_FILE=/var/lib/nvidia-mig-manager/checkpoint.json
129
+ MIG_PARTED_CONFIG_FILE=/etc/nvidia-mig-manager/config.yaml
130
+ MIG_PARTED_HOOKS_FILE=/etc/nvidia-mig-manager/hooks.yaml
131
+ MKL_INTERFACE_LAYER=LP64,GNU
132
+ MODULEPATH=/cm/local/modulefiles:/cm/shared/modulefiles
133
+ MODULESHOME=/cm/local/apps/environment-modules/4.5.3
134
+ MODULES_CMD=/cm/local/apps/environment-modules/4.5.3/libexec/modulecmd.tcl
135
+ MODULES_SET_SHELL_STARTUP=0
136
+ MOTD_SHOWN=pam
137
+ MPI_HOME=/usr/mpi/gcc/openmpi-4.1.7a1
138
+ MPI_RUN=/usr/mpi/gcc/openmpi-4.1.7a1/bin/mpirun
139
+ OLDPWD=/home/yangyaodong
140
+ PATH=/home/yangyaodong/.local/bin:/usr/local/cuda/bin:/usr/lpp/mmfs/bin:/usr/local/cuda/bin:/opt/bin:/home/yangyaodong/.local/bin:/aifs4su/yaodong/google-cloud-sdk/bin:/aifs4su/yaodong/miniconda3/envs/hantao_tiv/bin:/aifs4su/yaodong/miniconda3/condabin:/usr/mpi/gcc/openmpi-4.1.7a1/bin:/usr/local/cuda/bin:/usr/lpp/mmfs/bin:/cm/shared/apps/slurm/current/sbin:/cm/shared/apps/slurm/current/bin:/usr/local/cuda/bin:/opt/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin:/usr/games:/usr/local/games:/snap/bin:/sbin:/usr/sbin:/cm/local/apps/environment-modules/4.5.3/bin
141
+ PATH_modshare=/usr/mpi/gcc/openmpi-4.1.7a1/bin:1:/opt/bin/:1:/usr/bin:1:/usr/local/bin:1:/cm/shared/apps/slurm/current/bin:1:/cm/shared/apps/slurm/current/sbin:1:/bin:1:/snap/bin:1:/sbin:1:/home/yangyaodong/.vscode-server/cli/servers/Stable-38c31bc77e0dd6ae88a4e9cc93428cc27a56ba40/server/bin/remote-cli:1:/usr/sbin:1:/cm/local/apps/environment-modules/4.5.3/bin:1:/usr/games:1:/usr/local/sbin:1:/usr/lpp/mmfs/bin:1:/usr/local/cuda/bin:1:/usr/local/games:1
142
+ PWD=/aifs4su/yaodong/projects/hantao/dev_cham/align-anything/scripts
143
+ PYTHONHASHSEED=42
144
+ PYTHONPATH=/aifs4su/yaodong/projects/hantao/dev_cham/align-anything:/aifs4su/yaodong/projects/hantao/dev_cham/align-anything
145
+ RANK=0
146
+ SHELL=/bin/bash
147
+ SHLVL=5
148
+ SLURM_CONF=/cm/shared/apps/slurm/var/etc/slurm/slurm.conf
149
+ SSH_CLIENT=10.33.4.51 60672 22
150
+ SSH_CONNECTION=10.33.4.51 35276 10.33.5.36 22
151
+ SSL_CERT_DIR=/usr/lib/ssl/certs
152
+ SSL_CERT_FILE=/usr/lib/ssl/certs/ca-certificates.crt
153
+ TERM=screen
154
+ TERM_PROGRAM=tmux
155
+ TERM_PROGRAM_VERSION=3.2a
156
+ TMUX=/tmp/tmux-1028/default,1661839,139
157
+ TMUX_PANE=%139
158
+ TRITON_CACHE_DIR=/aifs4su/yaodong/cache/triton
159
+ USER=yangyaodong
160
+ VSCODE_GIT_ASKPASS_EXTRA_ARGS=
161
+ VSCODE_GIT_ASKPASS_MAIN=/home/yangyaodong/.vscode-server/cli/servers/Stable-38c31bc77e0dd6ae88a4e9cc93428cc27a56ba40/server/extensions/git/dist/askpass-main.js
162
+ VSCODE_GIT_ASKPASS_NODE=/home/yangyaodong/.vscode-server/cli/servers/Stable-38c31bc77e0dd6ae88a4e9cc93428cc27a56ba40/server/node
163
+ VSCODE_GIT_IPC_HANDLE=/run/user/1028/vscode-git-ba18af3aed.sock
164
+ VSCODE_IPC_HOOK_CLI=/run/user/1028/vscode-ipc-57558741-0df8-4930-ba26-d5e7527b0cd8.sock
165
+ WANDB_API_KEY=547f38af44135ca76a4f4eed9c8d135532da4960
166
+ WANDB_SERVICE=2-1311189-tcp-localhost-38981
167
+ WORLD_SIZE=8
168
+ XDG_DATA_DIRS=/usr/local/share:/usr/share:/var/lib/snapd/desktop
169
+ XDG_RUNTIME_DIR=/run/user/1028
170
+ XDG_SESSION_CLASS=user
171
+ XDG_SESSION_ID=2362
172
+ XDG_SESSION_TYPE=tty
173
+ XML_CATALOG_FILES=file:///aifs4su/yaodong/miniconda3/envs/hantao_tiv/etc/xml/catalog file:///etc/xml/catalog
174
+ _=/aifs4su/yaodong/miniconda3/envs/hantao_tiv/bin/deepspeed
175
+ _CE_CONDA=
176
+ _CE_M=
177
+ _LMFILES_=/cm/local/modulefiles/slurm/slurm/23.02.6:/cm/local/modulefiles/gcc/64/4.1.7a1
178
+ _LMFILES__modshare=/cm/local/modulefiles/slurm/slurm/23.02.6:1:/cm/local/modulefiles/gcc/64/4.1.7a1:1
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
preprocessor_config.json ADDED
@@ -0,0 +1,29 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "do_convert_rgb": true,
3
+ "do_normalize": true,
4
+ "do_rescale": true,
5
+ "do_resize": true,
6
+ "image_mean": [
7
+ 0.48145466,
8
+ 0.4578275,
9
+ 0.40821073
10
+ ],
11
+ "image_processor_type": "Qwen2VLImageProcessor",
12
+ "image_std": [
13
+ 0.26862954,
14
+ 0.26130258,
15
+ 0.27577711
16
+ ],
17
+ "max_pixels": 1003520,
18
+ "merge_size": 2,
19
+ "min_pixels": 3136,
20
+ "patch_size": 14,
21
+ "processor_class": "Qwen2VLProcessor",
22
+ "resample": 3,
23
+ "rescale_factor": 0.00392156862745098,
24
+ "size": {
25
+ "max_pixels": 1003520,
26
+ "min_pixels": 3136
27
+ },
28
+ "temporal_patch_size": 2
29
+ }
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a4f7d3d8412de5afaa7d62729bd2e5112c53cd04082eeac24c897e27382ae616
3
+ size 16577151950
script.sh ADDED
@@ -0,0 +1,74 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ #!/usr/bin/env bash
2
+ #
3
+ # Copyright 2024 PKU-Alignment Team. All Rights Reserved.
4
+ #
5
+ # Licensed under the Apache License, Version 2.0 (the "License");
6
+ # you may not use this file except in compliance with the License.
7
+ # You may obtain a copy of the License at
8
+ #
9
+ # http://www.apache.org/licenses/LICENSE-2.0
10
+ #
11
+ # Unless required by applicable law or agreed to in writing, software
12
+ # distributed under the License is distributed on an "AS IS" BASIS,
13
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14
+ # See the License for the specific language governing permissions and
15
+ # limitations under the License.
16
+ # ==============================================================================
17
+
18
+ export TRITON_CACHE_DIR="/aifs4su/yaodong/cache/triton"
19
+ # You can replace it with a local model path
20
+ MODEL_NAME_OR_PATH="/aifs4su/yaodong/models/Qwen2-VL-7B-Instruct"
21
+ # You can replace it with a local dataset path
22
+ TRAIN_DATASETS="/aifs4su/yaodong/projects/hantao/lang_feedback/video/outputs"
23
+ EVAL_DATASETS="/aifs4su/yaodong/datasets/ShareGPTVideo/extracted/split"
24
+ # You can replace it with a new path
25
+ OUTPUT_DIR="../outputs/dpo_tiv2t_1.5k_cai"
26
+ # For wandb online logging
27
+ export WANDB_API_KEY="547f38af44135ca76a4f4eed9c8d135532da4960"
28
+ # Source the setup script
29
+ source ./setup.sh
30
+
31
+ export CUDA_HOME=$CONDA_PREFIX
32
+
33
+ # Execute deepspeed command
34
+ deepspeed \
35
+ --master_port ${MASTER_PORT} \
36
+ --module align_anything.trainers.tiv_to_t.dpo \
37
+ --model_name_or_path ${MODEL_NAME_OR_PATH} \
38
+ --train_datasets ${TRAIN_DATASETS} \
39
+ --output_dir ${OUTPUT_DIR} \
40
+ --train_data_files cai_gen_outputs_batch_gen_washed_valid_clean_same.json \
41
+ --train_template NExTQA_preference \
42
+ --train_split 'train' \
43
+ --per_device_train_batch_size 1 \
44
+ --per_device_eval_batch_size 1 \
45
+ --gradient_accumulation_steps 1
46
+
47
+ export TRITON_CACHE_DIR="/aifs4su/yaodong/cache/triton"
48
+ # You can replace it with a local model path
49
+ MODEL_NAME_OR_PATH="/aifs4su/yaodong/models/Qwen2-VL-7B-Instruct"
50
+ # You can replace it with a local dataset path
51
+ TRAIN_DATASETS="/aifs4su/yaodong/datasets/aaa_dataset/TV2T-preference/extracted"
52
+ EVAL_DATASETS="/aifs4su/yaodong/datasets/ShareGPTVideo/extracted/split"
53
+ # You can replace it with a new path
54
+ OUTPUT_DIR="../outputs/dpo_tiv2t_1.5k_base"
55
+ # For wandb online logging
56
+ export WANDB_API_KEY="547f38af44135ca76a4f4eed9c8d135532da4960"
57
+ # Source the setup script
58
+ source ./setup.sh
59
+
60
+ export CUDA_HOME=$CONDA_PREFIX
61
+
62
+ # Execute deepspeed command
63
+ deepspeed \
64
+ --master_port ${MASTER_PORT} \
65
+ --module align_anything.trainers.tiv_to_t.dpo \
66
+ --model_name_or_path ${MODEL_NAME_OR_PATH} \
67
+ --train_datasets ${TRAIN_DATASETS} \
68
+ --output_dir ${OUTPUT_DIR} \
69
+ --train_data_files extracted_preference_1.5k_washed.json \
70
+ --train_template NExTQA_preference \
71
+ --train_split 'train' \
72
+ --per_device_train_batch_size 1 \
73
+ --per_device_eval_batch_size 1 \
74
+ --gradient_accumulation_steps 1
special_tokens_map.json ADDED
@@ -0,0 +1,45 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ "<|im_start|>",
4
+ "<|im_end|>",
5
+ "<|object_ref_start|>",
6
+ "<|object_ref_end|>",
7
+ "<|box_start|>",
8
+ "<|box_end|>",
9
+ "<|quad_start|>",
10
+ "<|quad_end|>",
11
+ "<|vision_start|>",
12
+ "<|vision_end|>",
13
+ "<|vision_pad|>",
14
+ "<|image_pad|>",
15
+ "<|video_pad|>"
16
+ ],
17
+ "bos_token": {
18
+ "content": "<s>",
19
+ "lstrip": false,
20
+ "normalized": false,
21
+ "rstrip": false,
22
+ "single_word": false
23
+ },
24
+ "eos_token": {
25
+ "content": "<|im_end|>",
26
+ "lstrip": false,
27
+ "normalized": false,
28
+ "rstrip": false,
29
+ "single_word": false
30
+ },
31
+ "pad_token": {
32
+ "content": "<|endoftext|>",
33
+ "lstrip": false,
34
+ "normalized": false,
35
+ "rstrip": false,
36
+ "single_word": false
37
+ },
38
+ "unk_token": {
39
+ "content": "<unk>",
40
+ "lstrip": false,
41
+ "normalized": false,
42
+ "rstrip": false,
43
+ "single_word": false
44
+ }
45
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,160 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": false,
3
+ "added_tokens_decoder": {
4
+ "128244": {
5
+ "content": "<unk>",
6
+ "lstrip": false,
7
+ "normalized": false,
8
+ "rstrip": false,
9
+ "single_word": false,
10
+ "special": true
11
+ },
12
+ "128245": {
13
+ "content": "<s>",
14
+ "lstrip": false,
15
+ "normalized": false,
16
+ "rstrip": false,
17
+ "single_word": false,
18
+ "special": true
19
+ },
20
+ "151643": {
21
+ "content": "<|endoftext|>",
22
+ "lstrip": false,
23
+ "normalized": false,
24
+ "rstrip": false,
25
+ "single_word": false,
26
+ "special": true
27
+ },
28
+ "151644": {
29
+ "content": "<|im_start|>",
30
+ "lstrip": false,
31
+ "normalized": false,
32
+ "rstrip": false,
33
+ "single_word": false,
34
+ "special": true
35
+ },
36
+ "151645": {
37
+ "content": "<|im_end|>",
38
+ "lstrip": false,
39
+ "normalized": false,
40
+ "rstrip": false,
41
+ "single_word": false,
42
+ "special": true
43
+ },
44
+ "151646": {
45
+ "content": "<|object_ref_start|>",
46
+ "lstrip": false,
47
+ "normalized": false,
48
+ "rstrip": false,
49
+ "single_word": false,
50
+ "special": true
51
+ },
52
+ "151647": {
53
+ "content": "<|object_ref_end|>",
54
+ "lstrip": false,
55
+ "normalized": false,
56
+ "rstrip": false,
57
+ "single_word": false,
58
+ "special": true
59
+ },
60
+ "151648": {
61
+ "content": "<|box_start|>",
62
+ "lstrip": false,
63
+ "normalized": false,
64
+ "rstrip": false,
65
+ "single_word": false,
66
+ "special": true
67
+ },
68
+ "151649": {
69
+ "content": "<|box_end|>",
70
+ "lstrip": false,
71
+ "normalized": false,
72
+ "rstrip": false,
73
+ "single_word": false,
74
+ "special": true
75
+ },
76
+ "151650": {
77
+ "content": "<|quad_start|>",
78
+ "lstrip": false,
79
+ "normalized": false,
80
+ "rstrip": false,
81
+ "single_word": false,
82
+ "special": true
83
+ },
84
+ "151651": {
85
+ "content": "<|quad_end|>",
86
+ "lstrip": false,
87
+ "normalized": false,
88
+ "rstrip": false,
89
+ "single_word": false,
90
+ "special": true
91
+ },
92
+ "151652": {
93
+ "content": "<|vision_start|>",
94
+ "lstrip": false,
95
+ "normalized": false,
96
+ "rstrip": false,
97
+ "single_word": false,
98
+ "special": true
99
+ },
100
+ "151653": {
101
+ "content": "<|vision_end|>",
102
+ "lstrip": false,
103
+ "normalized": false,
104
+ "rstrip": false,
105
+ "single_word": false,
106
+ "special": true
107
+ },
108
+ "151654": {
109
+ "content": "<|vision_pad|>",
110
+ "lstrip": false,
111
+ "normalized": false,
112
+ "rstrip": false,
113
+ "single_word": false,
114
+ "special": true
115
+ },
116
+ "151655": {
117
+ "content": "<|image_pad|>",
118
+ "lstrip": false,
119
+ "normalized": false,
120
+ "rstrip": false,
121
+ "single_word": false,
122
+ "special": true
123
+ },
124
+ "151656": {
125
+ "content": "<|video_pad|>",
126
+ "lstrip": false,
127
+ "normalized": false,
128
+ "rstrip": false,
129
+ "single_word": false,
130
+ "special": true
131
+ }
132
+ },
133
+ "additional_special_tokens": [
134
+ "<|im_start|>",
135
+ "<|im_end|>",
136
+ "<|object_ref_start|>",
137
+ "<|object_ref_end|>",
138
+ "<|box_start|>",
139
+ "<|box_end|>",
140
+ "<|quad_start|>",
141
+ "<|quad_end|>",
142
+ "<|vision_start|>",
143
+ "<|vision_end|>",
144
+ "<|vision_pad|>",
145
+ "<|image_pad|>",
146
+ "<|video_pad|>"
147
+ ],
148
+ "bos_token": "<s>",
149
+ "chat_template": "{% set image_count = namespace(value=0) %}{% set video_count = namespace(value=0) %}{% for message in messages %}{% if loop.first and message['role'] != 'system' %}<|im_start|>system\nYou are a helpful assistant.<|im_end|>\n{% endif %}<|im_start|>{{ message['role'] }}\n{% if message['content'] is string %}{{ message['content'] }}<|im_end|>\n{% else %}{% for content in message['content'] %}{% if content['type'] == 'image' or 'image' in content or 'image_url' in content %}{% set image_count.value = image_count.value + 1 %}{% if add_vision_id %}Picture {{ image_count.value }}: {% endif %}<|vision_start|><|image_pad|><|vision_end|>{% elif content['type'] == 'video' or 'video' in content %}{% set video_count.value = video_count.value + 1 %}{% if add_vision_id %}Video {{ video_count.value }}: {% endif %}<|vision_start|><|video_pad|><|vision_end|>{% elif 'text' in content %}{{ content['text'] }}{% endif %}{% endfor %}<|im_end|>\n{% endif %}{% endfor %}{% if add_generation_prompt %}<|im_start|>assistant\n{% endif %}",
150
+ "clean_up_tokenization_spaces": false,
151
+ "eos_token": "<|im_end|>",
152
+ "errors": "replace",
153
+ "model_max_length": 4096,
154
+ "pad_token": "<|endoftext|>",
155
+ "padding_side": "left",
156
+ "processor_class": "Qwen2VLProcessor",
157
+ "split_special_tokens": false,
158
+ "tokenizer_class": "Qwen2Tokenizer",
159
+ "unk_token": "<unk>"
160
+ }
vocab.json ADDED
The diff for this file is too large to render. See raw diff
 
wandb/debug-internal.log ADDED
The diff for this file is too large to render. See raw diff
 
wandb/debug.log ADDED
@@ -0,0 +1,29 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2024-09-21 11:52:59,195 INFO MainThread:1311189 [wandb_setup.py:_flush():76] Current SDK version is 0.17.5
2
+ 2024-09-21 11:52:59,196 INFO MainThread:1311189 [wandb_setup.py:_flush():76] Configure stats pid to 1311189
3
+ 2024-09-21 11:52:59,196 INFO MainThread:1311189 [wandb_setup.py:_flush():76] Loading settings from /home/yangyaodong/.config/wandb/settings
4
+ 2024-09-21 11:52:59,196 INFO MainThread:1311189 [wandb_setup.py:_flush():76] Loading settings from /aifs4su/yaodong/projects/hantao/dev_cham/align-anything/scripts/wandb/settings
5
+ 2024-09-21 11:52:59,196 INFO MainThread:1311189 [wandb_setup.py:_flush():76] Loading settings from environment variables: {'api_key': '***REDACTED***'}
6
+ 2024-09-21 11:52:59,196 INFO MainThread:1311189 [wandb_setup.py:_flush():76] Applying setup settings: {'_disable_service': False}
7
+ 2024-09-21 11:52:59,196 WARNING MainThread:1311189 [wandb_setup.py:_flush():76] Could not find program at -m align_anything.trainers.tiv_to_t.dpo
8
+ 2024-09-21 11:52:59,196 INFO MainThread:1311189 [wandb_setup.py:_flush():76] Inferring run settings from compute environment: {'program_relpath': None, 'program': '-m align_anything.trainers.tiv_to_t.dpo'}
9
+ 2024-09-21 11:52:59,196 INFO MainThread:1311189 [wandb_setup.py:_flush():76] Applying login settings: {}
10
+ 2024-09-21 11:52:59,196 INFO MainThread:1311189 [wandb_init.py:_log_setup():529] Logging user logs to ../outputs/dpo_tiv2t_1.5k_base/wandb/run-20240921_115259-p9bvnzls/logs/debug.log
11
+ 2024-09-21 11:52:59,196 INFO MainThread:1311189 [wandb_init.py:_log_setup():530] Logging internal logs to ../outputs/dpo_tiv2t_1.5k_base/wandb/run-20240921_115259-p9bvnzls/logs/debug-internal.log
12
+ 2024-09-21 11:52:59,196 INFO MainThread:1311189 [wandb_init.py:init():569] calling init triggers
13
+ 2024-09-21 11:52:59,197 INFO MainThread:1311189 [wandb_init.py:init():576] wandb.init called with sweep_config: {}
14
+ config: {'train_cfgs': {'ds_cfgs': 'ds_z3_config.json', 'epochs': 3, 'seed': 42, 'per_device_train_batch_size': 1.0, 'per_device_eval_batch_size': 1.0, 'gradient_accumulation_steps': 1.0, 'gradient_checkpointing': True, 'learning_rate': 1e-06, 'lr_scheduler_type': 'cosine', 'lr_warmup_ratio': 0.01, 'weight_decay': 0.0, 'adam_betas': [0.9, 0.95], 'bf16': True, 'fp16': False, 'eval_strategy': 'epoch', 'eval_interval': 10, 'regularization': 0.001, 'scale_coeff': 0.1, 'freeze_mm_proj': False, 'freeze_vision_tower': True, 'freeze_language_model': False}, 'data_cfgs': {'train_datasets': '/aifs4su/yaodong/datasets/aaa_dataset/TV2T-preference/extracted', 'train_template': 'NExTQA_preference', 'train_size': None, 'train_split': 'train', 'train_subset': None, 'train_data_files': 'extracted_preference_1.5k_washed.json', 'train_optional_args': [], 'eval_datasets': None, 'eval_template': None, 'eval_size': None, 'eval_split': None, 'eval_subset': None, 'eval_data_files': None, 'eval_optional_args': []}, 'logger_cfgs': {'log_type': 'wandb', 'log_project': 'align-anything', 'log_run_name': 'dpo', 'output_dir': '../outputs/dpo_tiv2t_1.5k_base', 'cache_dir': None, 'save_interval': 100000}, 'model_cfgs': {'model_name_or_path': '/aifs4su/yaodong/models/Qwen2-VL-7B-Instruct', 'trust_remote_code': True, 'model_max_length': 4096}, 'special_tokens': None}
15
+ 2024-09-21 11:52:59,197 INFO MainThread:1311189 [wandb_init.py:init():619] starting backend
16
+ 2024-09-21 11:52:59,197 INFO MainThread:1311189 [wandb_init.py:init():623] setting up manager
17
+ 2024-09-21 11:52:59,198 INFO MainThread:1311189 [backend.py:_multiprocessing_setup():105] multiprocessing start_methods=fork,spawn,forkserver, using: spawn
18
+ 2024-09-21 11:52:59,201 INFO MainThread:1311189 [wandb_init.py:init():631] backend started and connected
19
+ 2024-09-21 11:52:59,204 INFO MainThread:1311189 [wandb_init.py:init():720] updated telemetry
20
+ 2024-09-21 11:52:59,226 INFO MainThread:1311189 [wandb_init.py:init():753] communicating run to backend with 90.0 second timeout
21
+ 2024-09-21 11:52:59,742 INFO MainThread:1311189 [wandb_run.py:_on_init():2435] communicating current version
22
+ 2024-09-21 11:52:59,955 INFO MainThread:1311189 [wandb_run.py:_on_init():2444] got version response upgrade_message: "wandb version 0.18.1 is available! To upgrade, please run:\n $ pip install wandb --upgrade"
23
+
24
+ 2024-09-21 11:52:59,956 INFO MainThread:1311189 [wandb_init.py:init():804] starting run threads in backend
25
+ 2024-09-21 11:53:06,573 INFO MainThread:1311189 [wandb_run.py:_console_start():2413] atexit reg
26
+ 2024-09-21 11:53:06,574 INFO MainThread:1311189 [wandb_run.py:_redirect():2255] redirect: wrap_raw
27
+ 2024-09-21 11:53:06,574 INFO MainThread:1311189 [wandb_run.py:_redirect():2320] Wrapping output streams.
28
+ 2024-09-21 11:53:06,574 INFO MainThread:1311189 [wandb_run.py:_redirect():2345] Redirects installed.
29
+ 2024-09-21 11:53:06,633 INFO MainThread:1311189 [wandb_init.py:init():847] run started, returning control to user process
wandb/run-20240921_050939-9z0w7l09/files/conda-environment.yaml ADDED
@@ -0,0 +1,516 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ name: hantao_tiv
2
+ channels:
3
+ - nvidia/label/cuda-12.1.0
4
+ - nvidia
5
+ - pytorch
6
+ - huggingface
7
+ - conda-forge
8
+ - defaults
9
+ dependencies:
10
+ - _libgcc_mutex=0.1=conda_forge
11
+ - _openmp_mutex=4.5=2_gnu
12
+ - aom=3.9.1=hac33072_0
13
+ - asttokens=2.4.1=pyhd8ed1ab_0
14
+ - blas=1.0=mkl
15
+ - brotli-python=1.1.0=py311hb755f60_1
16
+ - bzip2=1.0.8=h4bc722e_7
17
+ - ca-certificates=2024.7.4=hbcca054_0
18
+ - cairo=1.18.0=hebfffa5_3
19
+ - certifi=2024.7.4=pyhd8ed1ab_0
20
+ - cffi=1.16.0=py311hb3a22ac_0
21
+ - charset-normalizer=3.3.2=pyhd8ed1ab_0
22
+ - comm=0.2.2=pyhd8ed1ab_0
23
+ - cuda=12.1.0=0
24
+ - cuda-cccl=12.1.55=0
25
+ - cuda-command-line-tools=12.1.0=0
26
+ - cuda-compiler=12.1.0=0
27
+ - cuda-cudart=12.1.55=0
28
+ - cuda-cudart-dev=12.1.55=0
29
+ - cuda-cudart-static=12.1.55=0
30
+ - cuda-cuobjdump=12.1.55=0
31
+ - cuda-cupti=12.1.62=0
32
+ - cuda-cupti-static=12.1.62=0
33
+ - cuda-cuxxfilt=12.1.55=0
34
+ - cuda-demo-suite=12.1.55=0
35
+ - cuda-documentation=12.1.55=0
36
+ - cuda-driver-dev=12.1.55=0
37
+ - cuda-gdb=12.1.55=0
38
+ - cuda-libraries=12.1.0=0
39
+ - cuda-libraries-dev=12.1.0=0
40
+ - cuda-libraries-static=12.1.0=0
41
+ - cuda-nsight=12.1.55=0
42
+ - cuda-nsight-compute=12.1.0=0
43
+ - cuda-nvcc=12.1.66=0
44
+ - cuda-nvdisasm=12.1.55=0
45
+ - cuda-nvml-dev=12.1.55=0
46
+ - cuda-nvprof=12.1.55=0
47
+ - cuda-nvprune=12.1.55=0
48
+ - cuda-nvrtc=12.1.55=0
49
+ - cuda-nvrtc-dev=12.1.55=0
50
+ - cuda-nvrtc-static=12.1.55=0
51
+ - cuda-nvtx=12.1.66=0
52
+ - cuda-nvvp=12.1.55=0
53
+ - cuda-opencl=12.1.56=0
54
+ - cuda-opencl-dev=12.1.56=0
55
+ - cuda-profiler-api=12.1.55=0
56
+ - cuda-runtime=12.1.0=0
57
+ - cuda-sanitizer-api=12.1.55=0
58
+ - cuda-toolkit=12.1.0=0
59
+ - cuda-tools=12.1.0=0
60
+ - cuda-visual-tools=12.1.0=0
61
+ - dav1d=1.2.1=hd590300_0
62
+ - debugpy=1.8.2=py311h4332511_0
63
+ - exceptiongroup=1.2.2=pyhd8ed1ab_0
64
+ - executing=2.0.1=pyhd8ed1ab_0
65
+ - expat=2.6.2=h59595ed_0
66
+ - ffmpeg=7.0.1=gpl_h9be9148_104
67
+ - filelock=3.15.4=pyhd8ed1ab_0
68
+ - font-ttf-dejavu-sans-mono=2.37=hab24e00_0
69
+ - font-ttf-inconsolata=3.000=h77eed37_0
70
+ - font-ttf-source-code-pro=2.038=h77eed37_0
71
+ - font-ttf-ubuntu=0.83=h77eed37_2
72
+ - fontconfig=2.14.2=h14ed4e7_0
73
+ - fonts-conda-ecosystem=1=0
74
+ - fonts-conda-forge=1=0
75
+ - freetype=2.12.1=h267a509_2
76
+ - fribidi=1.0.10=h36c2ea0_0
77
+ - gds-tools=1.6.0.25=0
78
+ - gettext=0.22.5=h59595ed_2
79
+ - gettext-tools=0.22.5=h59595ed_2
80
+ - git-lfs=3.5.1=ha770c72_0
81
+ - gmp=6.3.0=hac33072_2
82
+ - gmpy2=2.1.5=py311hc4f1f91_1
83
+ - gnutls=3.7.9=hb077bed_0
84
+ - graphite2=1.3.13=h59595ed_1003
85
+ - h2=4.1.0=pyhd8ed1ab_0
86
+ - harfbuzz=9.0.0=hda332d3_1
87
+ - hpack=4.0.0=pyh9f0ad1d_0
88
+ - hyperframe=6.0.1=pyhd8ed1ab_0
89
+ - icu=75.1=he02047a_0
90
+ - idna=3.7=pyhd8ed1ab_0
91
+ - importlib-metadata=8.2.0=pyha770c72_0
92
+ - importlib_metadata=8.2.0=hd8ed1ab_0
93
+ - intel-openmp=2022.0.1=h06a4308_3633
94
+ - ipykernel=6.29.5=pyh3099207_0
95
+ - ipython=8.26.0=pyh707e725_0
96
+ - jedi=0.19.1=pyhd8ed1ab_0
97
+ - jinja2=3.1.4=pyhd8ed1ab_0
98
+ - jupyter_client=8.6.2=pyhd8ed1ab_0
99
+ - jupyter_core=5.7.2=py311h38be061_0
100
+ - keyutils=1.6.1=h166bdaf_0
101
+ - krb5=1.21.3=h659f571_0
102
+ - lame=3.100=h166bdaf_1003
103
+ - lcms2=2.16=hb7c19ff_0
104
+ - ld_impl_linux-64=2.40=hf3520f5_7
105
+ - lerc=4.0.0=h27087fc_0
106
+ - libabseil=20240116.2=cxx17_he02047a_1
107
+ - libasprintf=0.22.5=h661eb56_2
108
+ - libasprintf-devel=0.22.5=h661eb56_2
109
+ - libass=0.17.1=h39113c1_2
110
+ - libblas=3.9.0=16_linux64_mkl
111
+ - libcblas=3.9.0=16_linux64_mkl
112
+ - libcublas=12.1.0.26=0
113
+ - libcublas-dev=12.1.0.26=0
114
+ - libcublas-static=12.1.0.26=0
115
+ - libcufft=11.0.2.4=0
116
+ - libcufft-dev=11.0.2.4=0
117
+ - libcufft-static=11.0.2.4=0
118
+ - libcufile=1.6.0.25=0
119
+ - libcufile-dev=1.6.0.25=0
120
+ - libcufile-static=1.6.0.25=0
121
+ - libcurand=10.3.2.56=0
122
+ - libcurand-dev=10.3.2.56=0
123
+ - libcurand-static=10.3.2.56=0
124
+ - libcusolver=11.4.4.55=0
125
+ - libcusolver-dev=11.4.4.55=0
126
+ - libcusolver-static=11.4.4.55=0
127
+ - libcusparse=12.0.2.55=0
128
+ - libcusparse-dev=12.0.2.55=0
129
+ - libcusparse-static=12.0.2.55=0
130
+ - libdeflate=1.20=hd590300_0
131
+ - libdrm=2.4.122=h4ab18f5_0
132
+ - libedit=3.1.20191231=he28a2e2_2
133
+ - libexpat=2.6.2=h59595ed_0
134
+ - libffi=3.4.2=h7f98852_5
135
+ - libgcc-ng=14.1.0=h77fa898_0
136
+ - libgettextpo=0.22.5=h59595ed_2
137
+ - libgettextpo-devel=0.22.5=h59595ed_2
138
+ - libglib=2.80.3=h8a4344b_1
139
+ - libgomp=14.1.0=h77fa898_0
140
+ - libhwloc=2.11.1=default_hecaa2ac_1000
141
+ - libiconv=1.17=hd590300_2
142
+ - libidn2=2.3.7=hd590300_0
143
+ - libjpeg-turbo=3.0.0=hd590300_1
144
+ - liblapack=3.9.0=16_linux64_mkl
145
+ - libnpp=12.0.2.50=0
146
+ - libnpp-dev=12.0.2.50=0
147
+ - libnpp-static=12.0.2.50=0
148
+ - libnsl=2.0.1=hd590300_0
149
+ - libnvjitlink=12.1.105=0
150
+ - libnvjitlink-dev=12.1.55=0
151
+ - libnvjpeg=12.1.0.39=0
152
+ - libnvjpeg-dev=12.1.0.39=0
153
+ - libnvjpeg-static=12.1.0.39=0
154
+ - libnvvm-samples=12.1.55=0
155
+ - libopenvino=2024.2.0=h2da1b83_1
156
+ - libopenvino-auto-batch-plugin=2024.2.0=hb045406_1
157
+ - libopenvino-auto-plugin=2024.2.0=hb045406_1
158
+ - libopenvino-hetero-plugin=2024.2.0=h5c03a75_1
159
+ - libopenvino-intel-cpu-plugin=2024.2.0=h2da1b83_1
160
+ - libopenvino-intel-gpu-plugin=2024.2.0=h2da1b83_1
161
+ - libopenvino-intel-npu-plugin=2024.2.0=he02047a_1
162
+ - libopenvino-ir-frontend=2024.2.0=h5c03a75_1
163
+ - libopenvino-onnx-frontend=2024.2.0=h07e8aee_1
164
+ - libopenvino-paddle-frontend=2024.2.0=h07e8aee_1
165
+ - libopenvino-pytorch-frontend=2024.2.0=he02047a_1
166
+ - libopenvino-tensorflow-frontend=2024.2.0=h39126c6_1
167
+ - libopenvino-tensorflow-lite-frontend=2024.2.0=he02047a_1
168
+ - libopus=1.3.1=h7f98852_1
169
+ - libpciaccess=0.18=hd590300_0
170
+ - libpng=1.6.43=h2797004_0
171
+ - libprotobuf=4.25.3=h08a7969_0
172
+ - libsodium=1.0.18=h36c2ea0_1
173
+ - libsqlite=3.46.0=hde9e2c9_0
174
+ - libstdcxx-ng=14.1.0=hc0a3c3a_0
175
+ - libtasn1=4.19.0=h166bdaf_0
176
+ - libtiff=4.6.0=h1dd3fc0_3
177
+ - libunistring=0.9.10=h7f98852_0
178
+ - libuuid=2.38.1=h0b41bf4_0
179
+ - libva=2.22.0=hb711507_0
180
+ - libvpx=1.14.1=hac33072_0
181
+ - libwebp-base=1.4.0=hd590300_0
182
+ - libxcb=1.16=hd590300_0
183
+ - libxcrypt=4.4.36=hd590300_1
184
+ - libxml2=2.12.7=he7c6b58_4
185
+ - libzlib=1.3.1=h4ab18f5_1
186
+ - llvm-openmp=15.0.7=h0cdce71_0
187
+ - markupsafe=2.1.5=py311h459d7ec_0
188
+ - matplotlib-inline=0.1.7=pyhd8ed1ab_0
189
+ - mkl=2022.1.0=hc2b9512_224
190
+ - mpc=1.3.1=hfe3b2da_0
191
+ - mpfr=4.2.1=h38ae2d0_2
192
+ - mpmath=1.3.0=pyhd8ed1ab_0
193
+ - ncurses=6.5=h59595ed_0
194
+ - nest-asyncio=1.6.0=pyhd8ed1ab_0
195
+ - nettle=3.9.1=h7ab15ed_0
196
+ - networkx=3.3=pyhd8ed1ab_1
197
+ - nsight-compute=2023.1.0.15=0
198
+ - ocl-icd=2.3.2=hd590300_1
199
+ - openh264=2.4.1=h59595ed_0
200
+ - openjpeg=2.5.2=h488ebb8_0
201
+ - openssl=3.3.1=h4bc722e_2
202
+ - p11-kit=0.24.1=hc5aa10d_0
203
+ - packaging=24.1=pyhd8ed1ab_0
204
+ - parso=0.8.4=pyhd8ed1ab_0
205
+ - pcre2=10.44=h0f59acf_0
206
+ - pexpect=4.9.0=pyhd8ed1ab_0
207
+ - pickleshare=0.7.5=py_1003
208
+ - pillow=10.4.0=py311h82a398c_0
209
+ - pip=24.0=pyhd8ed1ab_0
210
+ - pixman=0.43.2=h59595ed_0
211
+ - prompt-toolkit=3.0.47=pyha770c72_0
212
+ - psutil=6.0.0=py311h331c9d8_0
213
+ - pthread-stubs=0.4=h36c2ea0_1001
214
+ - ptyprocess=0.7.0=pyhd3deb0d_0
215
+ - pugixml=1.14=h59595ed_0
216
+ - pure_eval=0.2.3=pyhd8ed1ab_0
217
+ - pycparser=2.22=pyhd8ed1ab_0
218
+ - pygments=2.18.0=pyhd8ed1ab_0
219
+ - pysocks=1.7.1=pyha2e5f31_6
220
+ - python=3.11.9=hb806964_0_cpython
221
+ - python_abi=3.11=4_cp311
222
+ - pytorch=2.4.0=py3.11_cuda12.1_cudnn9.1.0_0
223
+ - pytorch-cuda=12.1=ha16c6d3_5
224
+ - pytorch-mutex=1.0=cuda
225
+ - pyyaml=6.0.1=py311h459d7ec_1
226
+ - pyzmq=26.0.3=py311h08a0b41_0
227
+ - readline=8.2=h8228510_1
228
+ - requests=2.32.3=pyhd8ed1ab_0
229
+ - setuptools=71.0.4=pyhd8ed1ab_0
230
+ - six=1.16.0=pyh6c4a22f_0
231
+ - snappy=1.2.1=ha2e4443_0
232
+ - stack_data=0.6.2=pyhd8ed1ab_0
233
+ - svt-av1=2.1.2=hac33072_0
234
+ - sympy=1.13.0=pypyh2585a3b_103
235
+ - tbb=2021.12.0=h434a139_3
236
+ - tk=8.6.13=noxft_h4845f30_101
237
+ - torchaudio=2.4.0=py311_cu121
238
+ - torchtriton=3.0.0=py311
239
+ - tornado=6.4.1=py311h331c9d8_0
240
+ - traitlets=5.14.3=pyhd8ed1ab_0
241
+ - typing_extensions=4.12.2=pyha770c72_0
242
+ - urllib3=2.2.2=pyhd8ed1ab_1
243
+ - wayland=1.23.0=h5291e77_0
244
+ - wayland-protocols=1.36=hd8ed1ab_0
245
+ - wcwidth=0.2.13=pyhd8ed1ab_0
246
+ - wheel=0.43.0=pyhd8ed1ab_1
247
+ - x264=1!164.3095=h166bdaf_2
248
+ - x265=3.5=h924138e_3
249
+ - xorg-fixesproto=5.0=h7f98852_1002
250
+ - xorg-kbproto=1.0.7=h7f98852_1002
251
+ - xorg-libice=1.1.1=hd590300_0
252
+ - xorg-libsm=1.2.4=h7391055_0
253
+ - xorg-libx11=1.8.9=hb711507_1
254
+ - xorg-libxau=1.0.11=hd590300_0
255
+ - xorg-libxdmcp=1.1.3=h7f98852_0
256
+ - xorg-libxext=1.3.4=h0b41bf4_2
257
+ - xorg-libxfixes=5.0.3=h7f98852_1004
258
+ - xorg-libxrender=0.9.11=hd590300_0
259
+ - xorg-renderproto=0.11.1=h7f98852_1002
260
+ - xorg-xextproto=7.3.0=h0b41bf4_1003
261
+ - xorg-xproto=7.0.31=h7f98852_1007
262
+ - xz=5.2.6=h166bdaf_0
263
+ - yaml=0.2.5=h7f98852_2
264
+ - zeromq=4.3.5=h75354e8_4
265
+ - zipp=3.19.2=pyhd8ed1ab_0
266
+ - zlib=1.3.1=h4ab18f5_1
267
+ - zstandard=0.23.0=py311h5cd10c7_0
268
+ - zstd=1.5.6=ha6fb4c9_0
269
+ - pip:
270
+ - about-time==4.2.1
271
+ - absl-py==2.1.0
272
+ - accelerate==0.34.0
273
+ - aiofiles==23.2.1
274
+ - aiohttp==3.9.5
275
+ - aiohttp-retry==2.8.3
276
+ - aiosignal==1.3.1
277
+ - align-anything==0.0.1.dev0
278
+ - alive-progress==3.1.5
279
+ - amqp==5.2.0
280
+ - annotated-types==0.7.0
281
+ - antlr4-python3-runtime==4.9.3
282
+ - anyio==4.4.0
283
+ - appdirs==1.4.4
284
+ - asyncssh==2.16.0
285
+ - atpublic==5.0
286
+ - attrs==23.2.0
287
+ - audioread==3.0.1
288
+ - backoff==2.2.1
289
+ - billiard==4.2.0
290
+ - boto3==1.35.9
291
+ - botocore==1.35.9
292
+ - cachetools==5.4.0
293
+ - celery==5.4.0
294
+ - cfgv==3.4.0
295
+ - click==8.1.7
296
+ - click-didyoumean==0.3.1
297
+ - click-plugins==1.1.1
298
+ - click-repl==0.3.0
299
+ - cloudpickle==3.0.0
300
+ - cmake==3.30.1
301
+ - colorama==0.4.6
302
+ - commonmark==0.9.1
303
+ - configobj==5.0.8
304
+ - contourpy==1.2.1
305
+ - cryptography==43.0.0
306
+ - cycler==0.12.1
307
+ - dacite==1.6.0
308
+ - dagshub==0.3.35
309
+ - dagshub-annotation-converter==0.1.0
310
+ - dataclasses-json==0.6.7
311
+ - datasets==2.20.0
312
+ - decorator==4.4.2
313
+ - deepspeed==0.14.4
314
+ - dictdiffer==0.9.0
315
+ - diffusers==0.29.2
316
+ - dill==0.3.8
317
+ - diskcache==5.6.3
318
+ - distlib==0.3.8
319
+ - distro==1.9.0
320
+ - dnspython==2.6.1
321
+ - docker-pycreds==0.4.0
322
+ - docstring-parser==0.16
323
+ - dpath==2.2.0
324
+ - dulwich==0.22.1
325
+ - dvc==3.55.1
326
+ - dvc-data==3.16.5
327
+ - dvc-http==2.32.0
328
+ - dvc-objects==5.1.0
329
+ - dvc-render==1.0.2
330
+ - dvc-studio-client==0.21.0
331
+ - dvc-task==0.4.0
332
+ - einops==0.8.0
333
+ - email-validator==2.2.0
334
+ - entrypoints==0.4
335
+ - fastapi==0.111.1
336
+ - fastapi-cli==0.0.4
337
+ - ffmpy==0.3.3
338
+ - fire==0.6.0
339
+ - flatten-dict==0.4.2
340
+ - flufl-lock==8.1.0
341
+ - fonttools==4.53.1
342
+ - frozenlist==1.4.1
343
+ - fsspec==2024.5.0
344
+ - funcy==2.0
345
+ - fusepy==3.0.1
346
+ - gitdb==4.0.11
347
+ - gitpython==3.1.43
348
+ - gql==3.5.0
349
+ - gradio==4.39.0
350
+ - gradio-client==1.1.1
351
+ - gradio-multimodalchatbot==0.0.1
352
+ - grandalf==0.8
353
+ - grapheme==0.6.0
354
+ - graphql-core==3.2.3
355
+ - grpcio==1.65.1
356
+ - gto==1.7.1
357
+ - h11==0.14.0
358
+ - hjson==3.1.0
359
+ - httpcore==1.0.5
360
+ - httptools==0.6.1
361
+ - httpx==0.27.2
362
+ - huggingface-hub==0.24.3
363
+ - hydra-core==1.3.2
364
+ - identify==2.6.0
365
+ - imageio==2.35.1
366
+ - imageio-ffmpeg==0.5.1
367
+ - importlib-resources==6.4.0
368
+ - iniconfig==2.0.0
369
+ - interegular==0.3.3
370
+ - iterative-telemetry==0.0.8
371
+ - jmespath==1.0.1
372
+ - joblib==1.4.2
373
+ - jsonschema==4.23.0
374
+ - jsonschema-specifications==2023.12.1
375
+ - kiwisolver==1.4.5
376
+ - kombu==5.4.0
377
+ - lark==1.1.9
378
+ - lazy-loader==0.4
379
+ - librosa==0.10.2.post1
380
+ - llamafactory==0.8.4.dev0
381
+ - llvmlite==0.43.0
382
+ - lm-format-enforcer==0.10.3
383
+ - lxml==5.3.0
384
+ - markdown==3.6
385
+ - markdown-it-py==3.0.0
386
+ - marshmallow==3.22.0
387
+ - matplotlib==3.9.1
388
+ - mdurl==0.1.2
389
+ - mmsg==0.1.dev14+gbd2b056.d20240803
390
+ - moviepy==1.0.3
391
+ - mpi4py==4.0.0
392
+ - msgpack==1.0.8
393
+ - multidict==6.0.5
394
+ - multiprocess==0.70.16
395
+ - mypy-extensions==1.0.0
396
+ - ninja==1.11.1.1
397
+ - nodeenv==1.9.1
398
+ - numba==0.60.0
399
+ - numpy==1.26.4
400
+ - nvidia-cublas-cu12==12.1.3.1
401
+ - nvidia-cuda-cupti-cu12==12.1.105
402
+ - nvidia-cuda-nvrtc-cu12==12.1.105
403
+ - nvidia-cuda-runtime-cu12==12.1.105
404
+ - nvidia-cudnn-cu12==8.9.2.26
405
+ - nvidia-cufft-cu12==11.0.2.54
406
+ - nvidia-curand-cu12==10.3.2.106
407
+ - nvidia-cusolver-cu12==11.4.5.107
408
+ - nvidia-cusparse-cu12==12.1.0.106
409
+ - nvidia-ml-py==12.535.161
410
+ - nvidia-nccl-cu12==2.20.5
411
+ - nvidia-nvjitlink-cu12==12.5.82
412
+ - nvidia-nvtx-cu12==12.1.105
413
+ - nvitop==1.3.2
414
+ - omegaconf==2.3.0
415
+ - openai==1.37.1
416
+ - optree==0.12.1
417
+ - orjson==3.10.6
418
+ - outlines==0.0.47.dev37+g26e2934
419
+ - pandas==2.2.2
420
+ - pathspec==0.12.1
421
+ - pathvalidate==3.0.0
422
+ - peft==0.12.0
423
+ - platformdirs==3.11.0
424
+ - pluggy==1.5.0
425
+ - pooch==1.8.2
426
+ - pre-commit==3.8.0
427
+ - proglog==0.1.10
428
+ - prometheus-client==0.20.0
429
+ - prometheus-fastapi-instrumentator==7.0.0
430
+ - protobuf==4.25.4
431
+ - py-cpuinfo==9.0.0
432
+ - pyairports==2.1.1
433
+ - pyarrow==17.0.0
434
+ - pyarrow-hotfix==0.6
435
+ - pyav==13.0.0
436
+ - pycountry==24.6.1
437
+ - pydantic==2.8.2
438
+ - pydantic-core==2.20.1
439
+ - pydot==3.0.1
440
+ - pydub==0.25.1
441
+ - pygit2==1.15.1
442
+ - pygtrie==2.5.0
443
+ - pyparsing==3.1.2
444
+ - pytest==8.3.2
445
+ - python-dateutil==2.9.0.post0
446
+ - python-dotenv==1.0.1
447
+ - python-multipart==0.0.9
448
+ - pytz==2024.1
449
+ - ranger-fm==1.9.3
450
+ - ray==2.34.0
451
+ - referencing==0.35.1
452
+ - regex==2024.7.24
453
+ - requests-toolbelt==1.0.0
454
+ - rfc3986==1.5.0
455
+ - rich==13.1.0
456
+ - rpds-py==0.19.1
457
+ - ruamel-yaml==0.18.6
458
+ - ruamel-yaml-clib==0.2.8
459
+ - ruff==0.5.5
460
+ - s3transfer==0.10.2
461
+ - safetensors==0.4.3
462
+ - scikit-learn==1.5.1
463
+ - scipy==1.14.0
464
+ - scmrepo==3.3.7
465
+ - semantic-version==2.10.0
466
+ - semver==3.0.2
467
+ - sentencepiece==0.2.0
468
+ - sentry-sdk==2.11.0
469
+ - setproctitle==1.3.3
470
+ - shellingham==1.5.4
471
+ - shortuuid==1.0.13
472
+ - shtab==1.7.1
473
+ - smmap==5.0.1
474
+ - sniffio==1.3.1
475
+ - soundfile==0.12.1
476
+ - soxr==0.4.0
477
+ - sqltrie==0.11.1
478
+ - sse-starlette==2.1.3
479
+ - starlette==0.37.2
480
+ - tabulate==0.9.0
481
+ - tenacity==8.2.3
482
+ - tensorboard==2.17.0
483
+ - tensorboard-data-server==0.7.2
484
+ - term-image==0.7.2
485
+ - termcolor==2.4.0
486
+ - threadpoolctl==3.5.0
487
+ - tiktoken==0.7.0
488
+ - tokenizers==0.19.1
489
+ - tomlkit==0.12.0
490
+ - torch==2.3.1
491
+ - torchvision==0.18.1
492
+ - tqdm==4.66.4
493
+ - transformers==4.45.0.dev0
494
+ - treelib==1.6.4
495
+ - triton==2.3.1
496
+ - trl==0.9.6
497
+ - typer==0.12.3
498
+ - typing-inspect==0.9.0
499
+ - tyro==0.8.10
500
+ - tzdata==2024.1
501
+ - uvicorn==0.30.3
502
+ - uvloop==0.19.0
503
+ - vine==5.1.0
504
+ - virtualenv==20.26.3
505
+ - vllm==0.5.3.post1
506
+ - vllm-flash-attn==2.5.9.post1
507
+ - voluptuous==0.15.2
508
+ - wandb==0.17.5
509
+ - watchfiles==0.22.0
510
+ - websockets==11.0.3
511
+ - werkzeug==3.0.3
512
+ - xformers==0.0.27
513
+ - xxhash==3.4.1
514
+ - yarl==1.9.4
515
+ - zc-lockfile==3.0.post1
516
+ prefix: /aifs4su/yaodong/miniconda3/envs/hantao_tiv
wandb/run-20240921_050939-9z0w7l09/files/config.yaml ADDED
@@ -0,0 +1,112 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ wandb_version: 1
2
+
3
+ train_cfgs:
4
+ desc: null
5
+ value:
6
+ ds_cfgs: ds_z3_config.json
7
+ epochs: 3
8
+ seed: 42
9
+ per_device_train_batch_size: 1.0
10
+ per_device_eval_batch_size: 1.0
11
+ gradient_accumulation_steps: 1.0
12
+ gradient_checkpointing: true
13
+ learning_rate: 1.0e-06
14
+ lr_scheduler_type: cosine
15
+ lr_warmup_ratio: 0.01
16
+ weight_decay: 0.0
17
+ adam_betas:
18
+ - 0.9
19
+ - 0.95
20
+ bf16: true
21
+ fp16: false
22
+ eval_strategy: epoch
23
+ eval_interval: 10
24
+ regularization: 0.001
25
+ scale_coeff: 0.1
26
+ freeze_mm_proj: false
27
+ freeze_vision_tower: true
28
+ freeze_language_model: false
29
+ data_cfgs:
30
+ desc: null
31
+ value:
32
+ train_datasets: /aifs4su/yaodong/datasets/aaa_dataset/TV2T-preference/extracted
33
+ train_template: NExTQA_preference
34
+ train_size: null
35
+ train_split: train
36
+ train_subset: null
37
+ train_data_files: extracted_preference_1.5k_washed.json
38
+ train_optional_args: []
39
+ eval_datasets: null
40
+ eval_template: null
41
+ eval_size: null
42
+ eval_split: null
43
+ eval_subset: null
44
+ eval_data_files: null
45
+ eval_optional_args: []
46
+ logger_cfgs:
47
+ desc: null
48
+ value:
49
+ log_type: wandb
50
+ log_project: align-anything
51
+ log_run_name: dpo
52
+ output_dir: ../outputs/dpo_tiv2t_1.5k_base
53
+ cache_dir: null
54
+ save_interval: 100000
55
+ model_cfgs:
56
+ desc: null
57
+ value:
58
+ model_name_or_path: /aifs4su/yaodong/models/Qwen2-VL-7B-Instruct
59
+ trust_remote_code: true
60
+ model_max_length: 4096
61
+ special_tokens:
62
+ desc: null
63
+ value: null
64
+ _wandb:
65
+ desc: null
66
+ value:
67
+ python_version: 3.11.9
68
+ cli_version: 0.17.5
69
+ framework: huggingface
70
+ huggingface_version: 4.45.0.dev0
71
+ is_jupyter_run: false
72
+ is_kaggle_kernel: false
73
+ start_time: 1726866579
74
+ t:
75
+ 1:
76
+ - 1
77
+ - 5
78
+ - 11
79
+ - 41
80
+ - 49
81
+ - 51
82
+ - 53
83
+ - 55
84
+ - 71
85
+ - 83
86
+ - 98
87
+ - 105
88
+ 2:
89
+ - 1
90
+ - 5
91
+ - 11
92
+ - 41
93
+ - 49
94
+ - 51
95
+ - 53
96
+ - 55
97
+ - 71
98
+ - 83
99
+ - 98
100
+ - 105
101
+ 3:
102
+ - 2
103
+ - 13
104
+ - 16
105
+ - 23
106
+ - 61
107
+ 4: 3.11.9
108
+ 5: 0.17.5
109
+ 6: 4.45.0.dev0
110
+ 8:
111
+ - 5
112
+ 13: linux-x86_64
wandb/run-20240921_050939-9z0w7l09/files/output.log ADDED
@@ -0,0 +1,206 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ ***** Running training *****
3
+
4
+ Training 1/3 epoch: 0%| | 0/531 [00:00<?, ?it/s]`use_cache=True` is incompatible with gradient checkpointing. Setting `use_cache=False`...
5
+ /aifs4su/yaodong/miniconda3/envs/hantao_tiv/lib/python3.11/site-packages/torch/utils/checkpoint.py:295: FutureWarning: `torch.cpu.amp.autocast(args...)` is deprecated. Please use `torch.amp.autocast('cpu', args...)` instead.
6
+ with torch.enable_grad(), device_autocast_ctx, torch.cpu.amp.autocast(**ctx.cpu_autocast_kwargs): # type: ignore[attr-defined]
7
+
8
+
9
+
10
+
11
+
12
+
13
+
14
+
15
+ Training 1/3 epoch (loss 0.6357): 2%|█▋ | 9/531 [01:30<1:21:14, 9.34s/it]
16
+
17
+
18
+
19
+
20
+
21
+
22
+
23
+
24
+
25
+
26
+ Training 1/3 epoch (loss 1.1789): 4%|███▌ | 19/531 [03:00<1:15:00, 8.79s/it]
27
+
28
+
29
+
30
+
31
+
32
+
33
+
34
+
35
+
36
+
37
+ Training 1/3 epoch (loss 0.6288): 5%|█████▍ | 29/531 [04:47<1:30:27, 10.81s/it]
38
+
39
+
40
+
41
+
42
+
43
+
44
+
45
+
46
+
47
+
48
+ Training 1/3 epoch (loss 0.3259): 7%|███████▎ | 39/531 [06:44<1:33:55, 11.46s/it]
49
+
50
+
51
+
52
+
53
+
54
+
55
+
56
+
57
+
58
+
59
+ Training 1/3 epoch (loss 0.9580): 9%|█████████▏ | 49/531 [08:26<1:20:24, 10.01s/it]
60
+
61
+
62
+
63
+
64
+
65
+
66
+
67
+
68
+
69
+
70
+ Training 1/3 epoch (loss 0.2154): 11%|███████████ | 59/531 [10:01<1:14:08, 9.43s/it]
71
+
72
+
73
+
74
+
75
+
76
+
77
+
78
+
79
+
80
+
81
+ Training 1/3 epoch (loss 0.5728): 13%|████████████▉ | 69/531 [11:44<1:22:35, 10.73s/it]
82
+
83
+
84
+
85
+
86
+
87
+
88
+
89
+
90
+
91
+
92
+ Training 1/3 epoch (loss 0.9818): 15%|██████████████▉ | 79/531 [13:38<1:16:33, 10.16s/it]
93
+
94
+
95
+
96
+
97
+
98
+
99
+
100
+
101
+
102
+
103
+
104
+ Training 1/3 epoch (loss 0.3341): 17%|████████████████▊ | 89/531 [15:09<1:10:36, 9.58s/it]
105
+
106
+
107
+
108
+
109
+
110
+
111
+
112
+
113
+
114
+
115
+
116
+ Training 1/3 epoch (loss 0.6811): 19%|██████████████████▋ | 99/531 [16:57<1:07:05, 9.32s/it]
117
+
118
+
119
+
120
+
121
+
122
+
123
+
124
+
125
+
126
+
127
+
128
+ Training 1/3 epoch (loss 0.3843): 21%|████████████████████▎ | 109/531 [18:36<1:11:34, 10.18s/it]
129
+
130
+
131
+
132
+
133
+
134
+
135
+
136
+
137
+
138
+
139
+ Training 1/3 epoch (loss 0.8316): 22%|██████████████████████▏ | 119/531 [20:10<1:02:22, 9.08s/it]
140
+
141
+
142
+
143
+
144
+
145
+
146
+
147
+
148
+
149
+
150
+ Training 1/3 epoch (loss 0.9861): 24%|████████████████████████▌ | 129/531 [21:37<59:53, 8.94s/it]
151
+
152
+
153
+
154
+
155
+
156
+
157
+
158
+
159
+
160
+
161
+ Training 1/3 epoch (loss 0.5590): 26%|██████████████████████████▍ | 139/531 [22:58<50:15, 7.69s/it]
162
+
163
+
164
+
165
+
166
+
167
+
168
+
169
+
170
+
171
+ Training 1/3 epoch (loss 0.6365): 28%|███████████████████████████▌ | 148/531 [24:33<1:16:08, 11.93s/it]Traceback (most recent call last):
172
+ File "<frozen runpy>", line 198, in _run_module_as_main
173
+ File "<frozen runpy>", line 88, in _run_code
174
+ File "/aifs4su/yaodong/projects/hantao/dev_cham/align-anything/align_anything/trainers/tiv_to_t/dpo.py", line 182, in <module>
175
+ sys.exit(main())
176
+ ^^^^^^
177
+ File "/aifs4su/yaodong/projects/hantao/dev_cham/align-anything/align_anything/trainers/tiv_to_t/dpo.py", line 177, in main
178
+ trainer.train()
179
+ File "/aifs4su/yaodong/projects/hantao/dev_cham/align-anything/align_anything/trainers/text_to_text/dpo.py", line 254, in train
180
+ info = self.train_step(batch)
181
+ ^^^^^^^^^^^^^^^^^^^^^^
182
+ File "/aifs4su/yaodong/projects/hantao/dev_cham/align-anything/align_anything/trainers/text_to_text/dpo.py", line 205, in train_step
183
+ loss_dict = self.loss(batch=batch)
184
+ ^^^^^^^^^^^^^^^^^^^^^^
185
+ File "/aifs4su/yaodong/projects/hantao/dev_cham/align-anything/align_anything/trainers/tiv_to_t/dpo.py", line 136, in loss
186
+ loss = torch.stack(losses).mean() # size = ()
187
+ ^^^^^^^^^^^^^^^^^^^
188
+ RuntimeError: stack expects a non-empty TensorList
189
+ [rank0]: Traceback (most recent call last):
190
+ [rank0]: File "<frozen runpy>", line 198, in _run_module_as_main
191
+ [rank0]: File "<frozen runpy>", line 88, in _run_code
192
+ [rank0]: File "/aifs4su/yaodong/projects/hantao/dev_cham/align-anything/align_anything/trainers/tiv_to_t/dpo.py", line 182, in <module>
193
+ [rank0]: sys.exit(main())
194
+ [rank0]: ^^^^^^
195
+ [rank0]: File "/aifs4su/yaodong/projects/hantao/dev_cham/align-anything/align_anything/trainers/tiv_to_t/dpo.py", line 177, in main
196
+ [rank0]: trainer.train()
197
+ [rank0]: File "/aifs4su/yaodong/projects/hantao/dev_cham/align-anything/align_anything/trainers/text_to_text/dpo.py", line 254, in train
198
+ [rank0]: info = self.train_step(batch)
199
+ [rank0]: ^^^^^^^^^^^^^^^^^^^^^^
200
+ [rank0]: File "/aifs4su/yaodong/projects/hantao/dev_cham/align-anything/align_anything/trainers/text_to_text/dpo.py", line 205, in train_step
201
+ [rank0]: loss_dict = self.loss(batch=batch)
202
+ [rank0]: ^^^^^^^^^^^^^^^^^^^^^^
203
+ [rank0]: File "/aifs4su/yaodong/projects/hantao/dev_cham/align-anything/align_anything/trainers/tiv_to_t/dpo.py", line 136, in loss
204
+ [rank0]: loss = torch.stack(losses).mean() # size = ()
205
+ [rank0]: ^^^^^^^^^^^^^^^^^^^
206
+ [rank0]: RuntimeError: stack expects a non-empty TensorList
wandb/run-20240921_050939-9z0w7l09/files/requirements.txt ADDED
@@ -0,0 +1,325 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Brotli==1.1.0
2
+ GitPython==3.1.43
3
+ Jinja2==3.1.4
4
+ Markdown==3.6
5
+ MarkupSafe==2.1.5
6
+ PySocks==1.7.1
7
+ PyYAML==6.0.1
8
+ Pygments==2.18.0
9
+ Werkzeug==3.0.3
10
+ about-time==4.2.1
11
+ absl-py==2.1.0
12
+ accelerate==0.34.0
13
+ aiofiles==23.2.1
14
+ aiohttp-retry==2.8.3
15
+ aiohttp==3.9.5
16
+ aiosignal==1.3.1
17
+ align-anything==0.0.1.dev0
18
+ align-anything==0.0.1.dev0
19
+ alive-progress==3.1.5
20
+ amqp==5.2.0
21
+ annotated-types==0.7.0
22
+ antlr4-python3-runtime==4.9.3
23
+ anyio==4.4.0
24
+ appdirs==1.4.4
25
+ asttokens==2.4.1
26
+ asyncssh==2.16.0
27
+ atpublic==5.0
28
+ attrs==23.2.0
29
+ audioread==3.0.1
30
+ autocommand==2.2.2
31
+ backoff==2.2.1
32
+ backports.tarfile==1.2.0
33
+ billiard==4.2.0
34
+ boto3==1.35.9
35
+ botocore==1.35.9
36
+ cachetools==5.4.0
37
+ celery==5.4.0
38
+ certifi==2024.7.4
39
+ cffi==1.16.0
40
+ cfgv==3.4.0
41
+ charset-normalizer==3.3.2
42
+ click-didyoumean==0.3.1
43
+ click-plugins==1.1.1
44
+ click-repl==0.3.0
45
+ click==8.1.7
46
+ cloudpickle==3.0.0
47
+ cmake==3.30.1
48
+ colorama==0.4.6
49
+ comm==0.2.2
50
+ commonmark==0.9.1
51
+ configobj==5.0.8
52
+ contourpy==1.2.1
53
+ cryptography==43.0.0
54
+ cycler==0.12.1
55
+ dacite==1.6.0
56
+ dagshub-annotation-converter==0.1.0
57
+ dagshub==0.3.35
58
+ dataclasses-json==0.6.7
59
+ datasets==2.20.0
60
+ debugpy==1.8.2
61
+ decorator==4.4.2
62
+ deepspeed==0.14.4
63
+ dictdiffer==0.9.0
64
+ diffusers==0.29.2
65
+ dill==0.3.8
66
+ diskcache==5.6.3
67
+ distlib==0.3.8
68
+ distro==1.9.0
69
+ dnspython==2.6.1
70
+ docker-pycreds==0.4.0
71
+ docstring_parser==0.16
72
+ dpath==2.2.0
73
+ dulwich==0.22.1
74
+ dvc-data==3.16.5
75
+ dvc-http==2.32.0
76
+ dvc-objects==5.1.0
77
+ dvc-render==1.0.2
78
+ dvc-studio-client==0.21.0
79
+ dvc-task==0.4.0
80
+ dvc==3.55.1
81
+ einops==0.8.0
82
+ email_validator==2.2.0
83
+ entrypoints==0.4
84
+ exceptiongroup==1.2.2
85
+ executing==2.0.1
86
+ fastapi-cli==0.0.4
87
+ fastapi==0.111.1
88
+ ffmpy==0.3.3
89
+ filelock==3.15.4
90
+ fire==0.6.0
91
+ flatten-dict==0.4.2
92
+ flufl.lock==8.1.0
93
+ fonttools==4.53.1
94
+ frozenlist==1.4.1
95
+ fsspec==2024.5.0
96
+ funcy==2.0
97
+ fusepy==3.0.1
98
+ gitdb==4.0.11
99
+ gmpy2==2.1.5
100
+ gql==3.5.0
101
+ gradio==4.39.0
102
+ gradio_client==1.1.1
103
+ gradio_multimodalchatbot==0.0.1
104
+ grandalf==0.8
105
+ grapheme==0.6.0
106
+ graphql-core==3.2.3
107
+ grpcio==1.65.1
108
+ gto==1.7.1
109
+ h11==0.14.0
110
+ h2==4.1.0
111
+ hjson==3.1.0
112
+ hpack==4.0.0
113
+ httpcore==1.0.5
114
+ httptools==0.6.1
115
+ httpx==0.27.2
116
+ huggingface-hub==0.24.3
117
+ hydra-core==1.3.2
118
+ hyperframe==6.0.1
119
+ identify==2.6.0
120
+ idna==3.7
121
+ imageio-ffmpeg==0.5.1
122
+ imageio==2.35.1
123
+ importlib_metadata==8.0.0
124
+ importlib_metadata==8.2.0
125
+ importlib_resources==6.4.0
126
+ importlib_resources==6.4.0
127
+ inflect==7.3.1
128
+ iniconfig==2.0.0
129
+ interegular==0.3.3
130
+ ipykernel==6.29.5
131
+ ipython==8.26.0
132
+ iterative-telemetry==0.0.8
133
+ jaraco.context==5.3.0
134
+ jaraco.functools==4.0.1
135
+ jaraco.text==3.12.1
136
+ jedi==0.19.1
137
+ jmespath==1.0.1
138
+ joblib==1.4.2
139
+ jsonschema-specifications==2023.12.1
140
+ jsonschema==4.23.0
141
+ jupyter_client==8.6.2
142
+ jupyter_core==5.7.2
143
+ kiwisolver==1.4.5
144
+ kombu==5.4.0
145
+ lark==1.1.9
146
+ lazy_loader==0.4
147
+ librosa==0.10.2.post1
148
+ llamafactory==0.8.4.dev0
149
+ llamafactory==0.8.4.dev0
150
+ llvmlite==0.43.0
151
+ lm-format-enforcer==0.10.3
152
+ lxml==5.3.0
153
+ markdown-it-py==3.0.0
154
+ marshmallow==3.22.0
155
+ matplotlib-inline==0.1.7
156
+ matplotlib==3.9.1
157
+ mdurl==0.1.2
158
+ mmsg==0.1.dev14+gbd2b056.d20240803
159
+ more-itertools==10.3.0
160
+ moviepy==1.0.3
161
+ mpi4py==4.0.0
162
+ mpmath==1.3.0
163
+ msgpack==1.0.8
164
+ multidict==6.0.5
165
+ multiprocess==0.70.16
166
+ mypy-extensions==1.0.0
167
+ nest_asyncio==1.6.0
168
+ networkx==3.3
169
+ ninja==1.11.1.1
170
+ nodeenv==1.9.1
171
+ numba==0.60.0
172
+ numpy==1.26.4
173
+ nvidia-cublas-cu12==12.1.3.1
174
+ nvidia-cuda-cupti-cu12==12.1.105
175
+ nvidia-cuda-nvrtc-cu12==12.1.105
176
+ nvidia-cuda-runtime-cu12==12.1.105
177
+ nvidia-cudnn-cu12==8.9.2.26
178
+ nvidia-cufft-cu12==11.0.2.54
179
+ nvidia-curand-cu12==10.3.2.106
180
+ nvidia-cusolver-cu12==11.4.5.107
181
+ nvidia-cusparse-cu12==12.1.0.106
182
+ nvidia-ml-py==12.535.161
183
+ nvidia-nccl-cu12==2.20.5
184
+ nvidia-nvjitlink-cu12==12.5.82
185
+ nvidia-nvtx-cu12==12.1.105
186
+ nvitop==1.3.2
187
+ omegaconf==2.3.0
188
+ openai==1.37.1
189
+ optree==0.12.1
190
+ ordered-set==4.1.0
191
+ orjson==3.10.6
192
+ outlines==0.0.47.dev37+g26e2934
193
+ packaging==24.1
194
+ packaging==24.1
195
+ pandas==2.2.2
196
+ parso==0.8.4
197
+ pathspec==0.12.1
198
+ pathvalidate==3.0.0
199
+ peft==0.12.0
200
+ pexpect==4.9.0
201
+ pickleshare==0.7.5
202
+ pillow==10.4.0
203
+ pip==24.0
204
+ platformdirs==3.11.0
205
+ platformdirs==4.2.2
206
+ pluggy==1.5.0
207
+ pooch==1.8.2
208
+ pre-commit==3.8.0
209
+ proglog==0.1.10
210
+ prometheus-fastapi-instrumentator==7.0.0
211
+ prometheus_client==0.20.0
212
+ prompt_toolkit==3.0.47
213
+ protobuf==4.25.4
214
+ psutil==6.0.0
215
+ ptyprocess==0.7.0
216
+ pure_eval==0.2.3
217
+ py-cpuinfo==9.0.0
218
+ pyairports==2.1.1
219
+ pyarrow-hotfix==0.6
220
+ pyarrow==17.0.0
221
+ pyav==13.0.0
222
+ pycountry==24.6.1
223
+ pycparser==2.22
224
+ pydantic==2.8.2
225
+ pydantic_core==2.20.1
226
+ pydot==3.0.1
227
+ pydub==0.25.1
228
+ pygit2==1.15.1
229
+ pygtrie==2.5.0
230
+ pyparsing==3.1.2
231
+ pytest==8.3.2
232
+ python-dateutil==2.9.0
233
+ python-dateutil==2.9.0.post0
234
+ python-dotenv==1.0.1
235
+ python-multipart==0.0.9
236
+ pytz==2024.1
237
+ pyzmq==26.0.3
238
+ ranger-fm==1.9.3
239
+ ray==2.34.0
240
+ referencing==0.35.1
241
+ regex==2024.7.24
242
+ requests-toolbelt==1.0.0
243
+ requests==2.32.3
244
+ rfc3986==1.5.0
245
+ rich==13.1.0
246
+ rpds-py==0.19.1
247
+ ruamel.yaml.clib==0.2.8
248
+ ruamel.yaml==0.18.6
249
+ ruff==0.5.5
250
+ s3transfer==0.10.2
251
+ safetensors==0.4.3
252
+ scikit-learn==1.5.1
253
+ scipy==1.14.0
254
+ scmrepo==3.3.7
255
+ semantic-version==2.10.0
256
+ semver==3.0.2
257
+ sentencepiece==0.2.0
258
+ sentry-sdk==2.11.0
259
+ setproctitle==1.3.3
260
+ setuptools==71.0.4
261
+ shellingham==1.5.4
262
+ shortuuid==1.0.13
263
+ shtab==1.7.1
264
+ six==1.16.0
265
+ smmap==5.0.1
266
+ sniffio==1.3.1
267
+ soundfile==0.12.1
268
+ soxr==0.4.0
269
+ sqltrie==0.11.1
270
+ sse-starlette==2.1.3
271
+ stack-data==0.6.2
272
+ starlette==0.37.2
273
+ sympy==1.13.0
274
+ tabulate==0.9.0
275
+ tenacity==8.2.3
276
+ tensorboard-data-server==0.7.2
277
+ tensorboard==2.17.0
278
+ term-image==0.7.2
279
+ termcolor==2.4.0
280
+ threadpoolctl==3.5.0
281
+ tiktoken==0.7.0
282
+ tokenizers==0.19.1
283
+ tomli==2.0.1
284
+ tomlkit==0.12.0
285
+ torch==2.3.1
286
+ torch==2.4.0
287
+ torchaudio==2.4.0
288
+ torchvision==0.18.1
289
+ torchvision==0.19.0
290
+ tornado==6.4.1
291
+ tqdm==4.66.4
292
+ traitlets==5.14.3
293
+ transformers==4.45.0.dev0
294
+ treelib==1.6.4
295
+ triton==2.3.1
296
+ triton==3.0.0
297
+ trl==0.9.6
298
+ typeguard==4.3.0
299
+ typer==0.12.3
300
+ typing-inspect==0.9.0
301
+ typing_extensions==4.12.2
302
+ typing_extensions==4.12.2
303
+ tyro==0.8.10
304
+ tzdata==2024.1
305
+ urllib3==2.2.2
306
+ uvicorn==0.30.3
307
+ uvloop==0.19.0
308
+ vine==5.1.0
309
+ virtualenv==20.26.3
310
+ vllm-flash-attn==2.5.9.post1
311
+ vllm==0.5.3.post1
312
+ voluptuous==0.15.2
313
+ wandb==0.17.5
314
+ watchfiles==0.22.0
315
+ wcwidth==0.2.13
316
+ websockets==11.0.3
317
+ wheel==0.43.0
318
+ wheel==0.43.0
319
+ xformers==0.0.27
320
+ xxhash==3.4.1
321
+ yarl==1.9.4
322
+ zc.lockfile==3.0.post1
323
+ zipp==3.19.2
324
+ zipp==3.19.2
325
+ zstandard==0.23.0
wandb/run-20240921_050939-9z0w7l09/files/wandb-metadata.json ADDED
@@ -0,0 +1,1215 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "os": "Linux-5.15.0-1040-nvidia-x86_64-with-glibc2.35",
3
+ "python": "3.11.9",
4
+ "heartbeatAt": "2024-09-20T21:09:40.930520",
5
+ "startedAt": "2024-09-20T21:09:39.790516",
6
+ "docker": null,
7
+ "cuda": null,
8
+ "args": [
9
+ "--local_rank=0",
10
+ "--model_name_or_path",
11
+ "/aifs4su/yaodong/models/Qwen2-VL-7B-Instruct",
12
+ "--train_datasets",
13
+ "/aifs4su/yaodong/datasets/aaa_dataset/TV2T-preference/extracted",
14
+ "--output_dir",
15
+ "../outputs/dpo_tiv2t_1.5k_base",
16
+ "--train_data_files",
17
+ "extracted_preference_1.5k_washed.json",
18
+ "--train_template",
19
+ "NExTQA_preference",
20
+ "--train_split",
21
+ "train",
22
+ "--per_device_train_batch_size",
23
+ "1",
24
+ "--per_device_eval_batch_size",
25
+ "1",
26
+ "--gradient_accumulation_steps",
27
+ "1"
28
+ ],
29
+ "state": "running",
30
+ "program": "-m align_anything.trainers.tiv_to_t.dpo",
31
+ "codePathLocal": null,
32
+ "git": {
33
+ "remote": "git@github.com-hantao:htlou/align-anything.git",
34
+ "commit": "9eff99b0ee34f7265b8a2e1824650634c898f654"
35
+ },
36
+ "email": "2200017789@stu.pku.edu.cn",
37
+ "root": "/aifs4su/yaodong/projects/hantao/dev_cham/align-anything",
38
+ "host": "dgx-122",
39
+ "username": "yangyaodong",
40
+ "executable": "/aifs4su/yaodong/miniconda3/envs/hantao_tiv/bin/python3.11",
41
+ "cpu_count": 112,
42
+ "cpu_count_logical": 224,
43
+ "cpu_freq": {
44
+ "current": 2078.7158973214287,
45
+ "min": 800.0,
46
+ "max": 3800.0
47
+ },
48
+ "cpu_freq_per_core": [
49
+ {
50
+ "current": 2000.0,
51
+ "min": 800.0,
52
+ "max": 3800.0
53
+ },
54
+ {
55
+ "current": 2000.0,
56
+ "min": 800.0,
57
+ "max": 3800.0
58
+ },
59
+ {
60
+ "current": 2000.0,
61
+ "min": 800.0,
62
+ "max": 3800.0
63
+ },
64
+ {
65
+ "current": 2000.0,
66
+ "min": 800.0,
67
+ "max": 3800.0
68
+ },
69
+ {
70
+ "current": 2000.0,
71
+ "min": 800.0,
72
+ "max": 3800.0
73
+ },
74
+ {
75
+ "current": 2000.0,
76
+ "min": 800.0,
77
+ "max": 3800.0
78
+ },
79
+ {
80
+ "current": 2000.0,
81
+ "min": 800.0,
82
+ "max": 3800.0
83
+ },
84
+ {
85
+ "current": 2000.0,
86
+ "min": 800.0,
87
+ "max": 3800.0
88
+ },
89
+ {
90
+ "current": 2000.0,
91
+ "min": 800.0,
92
+ "max": 3800.0
93
+ },
94
+ {
95
+ "current": 2000.0,
96
+ "min": 800.0,
97
+ "max": 3800.0
98
+ },
99
+ {
100
+ "current": 2000.0,
101
+ "min": 800.0,
102
+ "max": 3800.0
103
+ },
104
+ {
105
+ "current": 2000.0,
106
+ "min": 800.0,
107
+ "max": 3800.0
108
+ },
109
+ {
110
+ "current": 2000.0,
111
+ "min": 800.0,
112
+ "max": 3800.0
113
+ },
114
+ {
115
+ "current": 2000.0,
116
+ "min": 800.0,
117
+ "max": 3800.0
118
+ },
119
+ {
120
+ "current": 3346.359,
121
+ "min": 800.0,
122
+ "max": 3800.0
123
+ },
124
+ {
125
+ "current": 2000.0,
126
+ "min": 800.0,
127
+ "max": 3800.0
128
+ },
129
+ {
130
+ "current": 3349.584,
131
+ "min": 800.0,
132
+ "max": 3800.0
133
+ },
134
+ {
135
+ "current": 2000.0,
136
+ "min": 800.0,
137
+ "max": 3800.0
138
+ },
139
+ {
140
+ "current": 2000.0,
141
+ "min": 800.0,
142
+ "max": 3800.0
143
+ },
144
+ {
145
+ "current": 2000.0,
146
+ "min": 800.0,
147
+ "max": 3800.0
148
+ },
149
+ {
150
+ "current": 2000.0,
151
+ "min": 800.0,
152
+ "max": 3800.0
153
+ },
154
+ {
155
+ "current": 3349.58,
156
+ "min": 800.0,
157
+ "max": 3800.0
158
+ },
159
+ {
160
+ "current": 2000.0,
161
+ "min": 800.0,
162
+ "max": 3800.0
163
+ },
164
+ {
165
+ "current": 2000.0,
166
+ "min": 800.0,
167
+ "max": 3800.0
168
+ },
169
+ {
170
+ "current": 3342.287,
171
+ "min": 800.0,
172
+ "max": 3800.0
173
+ },
174
+ {
175
+ "current": 2000.0,
176
+ "min": 800.0,
177
+ "max": 3800.0
178
+ },
179
+ {
180
+ "current": 2000.0,
181
+ "min": 800.0,
182
+ "max": 3800.0
183
+ },
184
+ {
185
+ "current": 3347.413,
186
+ "min": 800.0,
187
+ "max": 3800.0
188
+ },
189
+ {
190
+ "current": 2000.0,
191
+ "min": 800.0,
192
+ "max": 3800.0
193
+ },
194
+ {
195
+ "current": 2000.0,
196
+ "min": 800.0,
197
+ "max": 3800.0
198
+ },
199
+ {
200
+ "current": 2000.0,
201
+ "min": 800.0,
202
+ "max": 3800.0
203
+ },
204
+ {
205
+ "current": 2000.0,
206
+ "min": 800.0,
207
+ "max": 3800.0
208
+ },
209
+ {
210
+ "current": 2000.0,
211
+ "min": 800.0,
212
+ "max": 3800.0
213
+ },
214
+ {
215
+ "current": 2000.0,
216
+ "min": 800.0,
217
+ "max": 3800.0
218
+ },
219
+ {
220
+ "current": 2000.0,
221
+ "min": 800.0,
222
+ "max": 3800.0
223
+ },
224
+ {
225
+ "current": 2000.0,
226
+ "min": 800.0,
227
+ "max": 3800.0
228
+ },
229
+ {
230
+ "current": 2000.0,
231
+ "min": 800.0,
232
+ "max": 3800.0
233
+ },
234
+ {
235
+ "current": 2000.0,
236
+ "min": 800.0,
237
+ "max": 3800.0
238
+ },
239
+ {
240
+ "current": 2000.0,
241
+ "min": 800.0,
242
+ "max": 3800.0
243
+ },
244
+ {
245
+ "current": 2000.0,
246
+ "min": 800.0,
247
+ "max": 3800.0
248
+ },
249
+ {
250
+ "current": 2000.0,
251
+ "min": 800.0,
252
+ "max": 3800.0
253
+ },
254
+ {
255
+ "current": 2000.0,
256
+ "min": 800.0,
257
+ "max": 3800.0
258
+ },
259
+ {
260
+ "current": 2000.0,
261
+ "min": 800.0,
262
+ "max": 3800.0
263
+ },
264
+ {
265
+ "current": 2000.0,
266
+ "min": 800.0,
267
+ "max": 3800.0
268
+ },
269
+ {
270
+ "current": 3105.85,
271
+ "min": 800.0,
272
+ "max": 3800.0
273
+ },
274
+ {
275
+ "current": 2000.0,
276
+ "min": 800.0,
277
+ "max": 3800.0
278
+ },
279
+ {
280
+ "current": 2000.0,
281
+ "min": 800.0,
282
+ "max": 3800.0
283
+ },
284
+ {
285
+ "current": 2000.0,
286
+ "min": 800.0,
287
+ "max": 3800.0
288
+ },
289
+ {
290
+ "current": 2000.0,
291
+ "min": 800.0,
292
+ "max": 3800.0
293
+ },
294
+ {
295
+ "current": 2000.0,
296
+ "min": 800.0,
297
+ "max": 3800.0
298
+ },
299
+ {
300
+ "current": 2000.0,
301
+ "min": 800.0,
302
+ "max": 3800.0
303
+ },
304
+ {
305
+ "current": 2000.0,
306
+ "min": 800.0,
307
+ "max": 3800.0
308
+ },
309
+ {
310
+ "current": 2000.0,
311
+ "min": 800.0,
312
+ "max": 3800.0
313
+ },
314
+ {
315
+ "current": 2000.0,
316
+ "min": 800.0,
317
+ "max": 3800.0
318
+ },
319
+ {
320
+ "current": 2000.0,
321
+ "min": 800.0,
322
+ "max": 3800.0
323
+ },
324
+ {
325
+ "current": 2000.0,
326
+ "min": 800.0,
327
+ "max": 3800.0
328
+ },
329
+ {
330
+ "current": 2000.0,
331
+ "min": 800.0,
332
+ "max": 3800.0
333
+ },
334
+ {
335
+ "current": 3323.345,
336
+ "min": 800.0,
337
+ "max": 3800.0
338
+ },
339
+ {
340
+ "current": 2000.0,
341
+ "min": 800.0,
342
+ "max": 3800.0
343
+ },
344
+ {
345
+ "current": 2000.0,
346
+ "min": 800.0,
347
+ "max": 3800.0
348
+ },
349
+ {
350
+ "current": 2000.0,
351
+ "min": 800.0,
352
+ "max": 3800.0
353
+ },
354
+ {
355
+ "current": 2000.0,
356
+ "min": 800.0,
357
+ "max": 3800.0
358
+ },
359
+ {
360
+ "current": 2000.0,
361
+ "min": 800.0,
362
+ "max": 3800.0
363
+ },
364
+ {
365
+ "current": 2000.0,
366
+ "min": 800.0,
367
+ "max": 3800.0
368
+ },
369
+ {
370
+ "current": 2000.0,
371
+ "min": 800.0,
372
+ "max": 3800.0
373
+ },
374
+ {
375
+ "current": 2000.0,
376
+ "min": 800.0,
377
+ "max": 3800.0
378
+ },
379
+ {
380
+ "current": 2000.0,
381
+ "min": 800.0,
382
+ "max": 3800.0
383
+ },
384
+ {
385
+ "current": 2000.0,
386
+ "min": 800.0,
387
+ "max": 3800.0
388
+ },
389
+ {
390
+ "current": 2000.0,
391
+ "min": 800.0,
392
+ "max": 3800.0
393
+ },
394
+ {
395
+ "current": 2000.0,
396
+ "min": 800.0,
397
+ "max": 3800.0
398
+ },
399
+ {
400
+ "current": 2000.0,
401
+ "min": 800.0,
402
+ "max": 3800.0
403
+ },
404
+ {
405
+ "current": 2000.0,
406
+ "min": 800.0,
407
+ "max": 3800.0
408
+ },
409
+ {
410
+ "current": 2000.0,
411
+ "min": 800.0,
412
+ "max": 3800.0
413
+ },
414
+ {
415
+ "current": 2000.0,
416
+ "min": 800.0,
417
+ "max": 3800.0
418
+ },
419
+ {
420
+ "current": 2000.0,
421
+ "min": 800.0,
422
+ "max": 3800.0
423
+ },
424
+ {
425
+ "current": 2000.0,
426
+ "min": 800.0,
427
+ "max": 3800.0
428
+ },
429
+ {
430
+ "current": 2000.0,
431
+ "min": 800.0,
432
+ "max": 3800.0
433
+ },
434
+ {
435
+ "current": 2000.0,
436
+ "min": 800.0,
437
+ "max": 3800.0
438
+ },
439
+ {
440
+ "current": 2000.0,
441
+ "min": 800.0,
442
+ "max": 3800.0
443
+ },
444
+ {
445
+ "current": 2000.0,
446
+ "min": 800.0,
447
+ "max": 3800.0
448
+ },
449
+ {
450
+ "current": 2000.0,
451
+ "min": 800.0,
452
+ "max": 3800.0
453
+ },
454
+ {
455
+ "current": 2000.0,
456
+ "min": 800.0,
457
+ "max": 3800.0
458
+ },
459
+ {
460
+ "current": 2000.0,
461
+ "min": 800.0,
462
+ "max": 3800.0
463
+ },
464
+ {
465
+ "current": 2000.0,
466
+ "min": 800.0,
467
+ "max": 3800.0
468
+ },
469
+ {
470
+ "current": 2000.0,
471
+ "min": 800.0,
472
+ "max": 3800.0
473
+ },
474
+ {
475
+ "current": 2000.0,
476
+ "min": 800.0,
477
+ "max": 3800.0
478
+ },
479
+ {
480
+ "current": 2000.0,
481
+ "min": 800.0,
482
+ "max": 3800.0
483
+ },
484
+ {
485
+ "current": 2000.0,
486
+ "min": 800.0,
487
+ "max": 3800.0
488
+ },
489
+ {
490
+ "current": 2000.0,
491
+ "min": 800.0,
492
+ "max": 3800.0
493
+ },
494
+ {
495
+ "current": 2000.0,
496
+ "min": 800.0,
497
+ "max": 3800.0
498
+ },
499
+ {
500
+ "current": 2000.0,
501
+ "min": 800.0,
502
+ "max": 3800.0
503
+ },
504
+ {
505
+ "current": 2000.0,
506
+ "min": 800.0,
507
+ "max": 3800.0
508
+ },
509
+ {
510
+ "current": 2000.0,
511
+ "min": 800.0,
512
+ "max": 3800.0
513
+ },
514
+ {
515
+ "current": 2000.0,
516
+ "min": 800.0,
517
+ "max": 3800.0
518
+ },
519
+ {
520
+ "current": 2000.0,
521
+ "min": 800.0,
522
+ "max": 3800.0
523
+ },
524
+ {
525
+ "current": 2000.0,
526
+ "min": 800.0,
527
+ "max": 3800.0
528
+ },
529
+ {
530
+ "current": 2000.0,
531
+ "min": 800.0,
532
+ "max": 3800.0
533
+ },
534
+ {
535
+ "current": 2000.0,
536
+ "min": 800.0,
537
+ "max": 3800.0
538
+ },
539
+ {
540
+ "current": 2000.0,
541
+ "min": 800.0,
542
+ "max": 3800.0
543
+ },
544
+ {
545
+ "current": 2000.0,
546
+ "min": 800.0,
547
+ "max": 3800.0
548
+ },
549
+ {
550
+ "current": 3300.0,
551
+ "min": 800.0,
552
+ "max": 3800.0
553
+ },
554
+ {
555
+ "current": 2000.0,
556
+ "min": 800.0,
557
+ "max": 3800.0
558
+ },
559
+ {
560
+ "current": 2000.0,
561
+ "min": 800.0,
562
+ "max": 3800.0
563
+ },
564
+ {
565
+ "current": 2000.0,
566
+ "min": 800.0,
567
+ "max": 3800.0
568
+ },
569
+ {
570
+ "current": 2000.0,
571
+ "min": 800.0,
572
+ "max": 3800.0
573
+ },
574
+ {
575
+ "current": 2000.0,
576
+ "min": 800.0,
577
+ "max": 3800.0
578
+ },
579
+ {
580
+ "current": 2000.0,
581
+ "min": 800.0,
582
+ "max": 3800.0
583
+ },
584
+ {
585
+ "current": 2000.0,
586
+ "min": 800.0,
587
+ "max": 3800.0
588
+ },
589
+ {
590
+ "current": 2000.0,
591
+ "min": 800.0,
592
+ "max": 3800.0
593
+ },
594
+ {
595
+ "current": 2000.0,
596
+ "min": 800.0,
597
+ "max": 3800.0
598
+ },
599
+ {
600
+ "current": 2000.0,
601
+ "min": 800.0,
602
+ "max": 3800.0
603
+ },
604
+ {
605
+ "current": 2000.0,
606
+ "min": 800.0,
607
+ "max": 3800.0
608
+ },
609
+ {
610
+ "current": 2000.0,
611
+ "min": 800.0,
612
+ "max": 3800.0
613
+ },
614
+ {
615
+ "current": 2000.0,
616
+ "min": 800.0,
617
+ "max": 3800.0
618
+ },
619
+ {
620
+ "current": 3340.55,
621
+ "min": 800.0,
622
+ "max": 3800.0
623
+ },
624
+ {
625
+ "current": 2000.0,
626
+ "min": 800.0,
627
+ "max": 3800.0
628
+ },
629
+ {
630
+ "current": 2000.0,
631
+ "min": 800.0,
632
+ "max": 3800.0
633
+ },
634
+ {
635
+ "current": 2000.0,
636
+ "min": 800.0,
637
+ "max": 3800.0
638
+ },
639
+ {
640
+ "current": 2000.0,
641
+ "min": 800.0,
642
+ "max": 3800.0
643
+ },
644
+ {
645
+ "current": 2000.0,
646
+ "min": 800.0,
647
+ "max": 3800.0
648
+ },
649
+ {
650
+ "current": 2000.0,
651
+ "min": 800.0,
652
+ "max": 3800.0
653
+ },
654
+ {
655
+ "current": 2000.0,
656
+ "min": 800.0,
657
+ "max": 3800.0
658
+ },
659
+ {
660
+ "current": 2000.0,
661
+ "min": 800.0,
662
+ "max": 3800.0
663
+ },
664
+ {
665
+ "current": 2000.0,
666
+ "min": 800.0,
667
+ "max": 3800.0
668
+ },
669
+ {
670
+ "current": 2000.0,
671
+ "min": 800.0,
672
+ "max": 3800.0
673
+ },
674
+ {
675
+ "current": 2000.0,
676
+ "min": 800.0,
677
+ "max": 3800.0
678
+ },
679
+ {
680
+ "current": 2000.0,
681
+ "min": 800.0,
682
+ "max": 3800.0
683
+ },
684
+ {
685
+ "current": 2000.0,
686
+ "min": 800.0,
687
+ "max": 3800.0
688
+ },
689
+ {
690
+ "current": 2000.0,
691
+ "min": 800.0,
692
+ "max": 3800.0
693
+ },
694
+ {
695
+ "current": 2000.0,
696
+ "min": 800.0,
697
+ "max": 3800.0
698
+ },
699
+ {
700
+ "current": 2000.0,
701
+ "min": 800.0,
702
+ "max": 3800.0
703
+ },
704
+ {
705
+ "current": 2000.0,
706
+ "min": 800.0,
707
+ "max": 3800.0
708
+ },
709
+ {
710
+ "current": 2000.0,
711
+ "min": 800.0,
712
+ "max": 3800.0
713
+ },
714
+ {
715
+ "current": 2000.0,
716
+ "min": 800.0,
717
+ "max": 3800.0
718
+ },
719
+ {
720
+ "current": 2000.0,
721
+ "min": 800.0,
722
+ "max": 3800.0
723
+ },
724
+ {
725
+ "current": 2000.0,
726
+ "min": 800.0,
727
+ "max": 3800.0
728
+ },
729
+ {
730
+ "current": 2000.0,
731
+ "min": 800.0,
732
+ "max": 3800.0
733
+ },
734
+ {
735
+ "current": 2000.0,
736
+ "min": 800.0,
737
+ "max": 3800.0
738
+ },
739
+ {
740
+ "current": 2000.0,
741
+ "min": 800.0,
742
+ "max": 3800.0
743
+ },
744
+ {
745
+ "current": 2000.0,
746
+ "min": 800.0,
747
+ "max": 3800.0
748
+ },
749
+ {
750
+ "current": 2000.0,
751
+ "min": 800.0,
752
+ "max": 3800.0
753
+ },
754
+ {
755
+ "current": 2000.0,
756
+ "min": 800.0,
757
+ "max": 3800.0
758
+ },
759
+ {
760
+ "current": 3360.628,
761
+ "min": 800.0,
762
+ "max": 3800.0
763
+ },
764
+ {
765
+ "current": 2000.0,
766
+ "min": 800.0,
767
+ "max": 3800.0
768
+ },
769
+ {
770
+ "current": 2000.0,
771
+ "min": 800.0,
772
+ "max": 3800.0
773
+ },
774
+ {
775
+ "current": 2000.0,
776
+ "min": 800.0,
777
+ "max": 3800.0
778
+ },
779
+ {
780
+ "current": 2000.0,
781
+ "min": 800.0,
782
+ "max": 3800.0
783
+ },
784
+ {
785
+ "current": 2000.0,
786
+ "min": 800.0,
787
+ "max": 3800.0
788
+ },
789
+ {
790
+ "current": 2000.0,
791
+ "min": 800.0,
792
+ "max": 3800.0
793
+ },
794
+ {
795
+ "current": 2000.0,
796
+ "min": 800.0,
797
+ "max": 3800.0
798
+ },
799
+ {
800
+ "current": 2000.0,
801
+ "min": 800.0,
802
+ "max": 3800.0
803
+ },
804
+ {
805
+ "current": 2000.0,
806
+ "min": 800.0,
807
+ "max": 3800.0
808
+ },
809
+ {
810
+ "current": 2000.0,
811
+ "min": 800.0,
812
+ "max": 3800.0
813
+ },
814
+ {
815
+ "current": 2000.0,
816
+ "min": 800.0,
817
+ "max": 3800.0
818
+ },
819
+ {
820
+ "current": 2000.0,
821
+ "min": 800.0,
822
+ "max": 3800.0
823
+ },
824
+ {
825
+ "current": 2000.0,
826
+ "min": 800.0,
827
+ "max": 3800.0
828
+ },
829
+ {
830
+ "current": 2000.0,
831
+ "min": 800.0,
832
+ "max": 3800.0
833
+ },
834
+ {
835
+ "current": 3349.649,
836
+ "min": 800.0,
837
+ "max": 3800.0
838
+ },
839
+ {
840
+ "current": 2000.0,
841
+ "min": 800.0,
842
+ "max": 3800.0
843
+ },
844
+ {
845
+ "current": 2000.0,
846
+ "min": 800.0,
847
+ "max": 3800.0
848
+ },
849
+ {
850
+ "current": 2000.0,
851
+ "min": 800.0,
852
+ "max": 3800.0
853
+ },
854
+ {
855
+ "current": 2000.0,
856
+ "min": 800.0,
857
+ "max": 3800.0
858
+ },
859
+ {
860
+ "current": 2000.0,
861
+ "min": 800.0,
862
+ "max": 3800.0
863
+ },
864
+ {
865
+ "current": 2000.0,
866
+ "min": 800.0,
867
+ "max": 3800.0
868
+ },
869
+ {
870
+ "current": 2000.0,
871
+ "min": 800.0,
872
+ "max": 3800.0
873
+ },
874
+ {
875
+ "current": 2000.0,
876
+ "min": 800.0,
877
+ "max": 3800.0
878
+ },
879
+ {
880
+ "current": 2000.0,
881
+ "min": 800.0,
882
+ "max": 3800.0
883
+ },
884
+ {
885
+ "current": 2000.0,
886
+ "min": 800.0,
887
+ "max": 3800.0
888
+ },
889
+ {
890
+ "current": 2000.0,
891
+ "min": 800.0,
892
+ "max": 3800.0
893
+ },
894
+ {
895
+ "current": 2000.0,
896
+ "min": 800.0,
897
+ "max": 3800.0
898
+ },
899
+ {
900
+ "current": 2000.0,
901
+ "min": 800.0,
902
+ "max": 3800.0
903
+ },
904
+ {
905
+ "current": 2000.0,
906
+ "min": 800.0,
907
+ "max": 3800.0
908
+ },
909
+ {
910
+ "current": 2000.0,
911
+ "min": 800.0,
912
+ "max": 3800.0
913
+ },
914
+ {
915
+ "current": 2000.0,
916
+ "min": 800.0,
917
+ "max": 3800.0
918
+ },
919
+ {
920
+ "current": 2000.0,
921
+ "min": 800.0,
922
+ "max": 3800.0
923
+ },
924
+ {
925
+ "current": 2000.0,
926
+ "min": 800.0,
927
+ "max": 3800.0
928
+ },
929
+ {
930
+ "current": 2000.0,
931
+ "min": 800.0,
932
+ "max": 3800.0
933
+ },
934
+ {
935
+ "current": 2000.0,
936
+ "min": 800.0,
937
+ "max": 3800.0
938
+ },
939
+ {
940
+ "current": 2000.0,
941
+ "min": 800.0,
942
+ "max": 3800.0
943
+ },
944
+ {
945
+ "current": 2000.0,
946
+ "min": 800.0,
947
+ "max": 3800.0
948
+ },
949
+ {
950
+ "current": 2000.0,
951
+ "min": 800.0,
952
+ "max": 3800.0
953
+ },
954
+ {
955
+ "current": 2000.0,
956
+ "min": 800.0,
957
+ "max": 3800.0
958
+ },
959
+ {
960
+ "current": 2000.0,
961
+ "min": 800.0,
962
+ "max": 3800.0
963
+ },
964
+ {
965
+ "current": 2000.0,
966
+ "min": 800.0,
967
+ "max": 3800.0
968
+ },
969
+ {
970
+ "current": 2000.0,
971
+ "min": 800.0,
972
+ "max": 3800.0
973
+ },
974
+ {
975
+ "current": 2000.0,
976
+ "min": 800.0,
977
+ "max": 3800.0
978
+ },
979
+ {
980
+ "current": 2000.0,
981
+ "min": 800.0,
982
+ "max": 3800.0
983
+ },
984
+ {
985
+ "current": 2000.0,
986
+ "min": 800.0,
987
+ "max": 3800.0
988
+ },
989
+ {
990
+ "current": 2000.0,
991
+ "min": 800.0,
992
+ "max": 3800.0
993
+ },
994
+ {
995
+ "current": 2000.0,
996
+ "min": 800.0,
997
+ "max": 3800.0
998
+ },
999
+ {
1000
+ "current": 2000.0,
1001
+ "min": 800.0,
1002
+ "max": 3800.0
1003
+ },
1004
+ {
1005
+ "current": 2000.0,
1006
+ "min": 800.0,
1007
+ "max": 3800.0
1008
+ },
1009
+ {
1010
+ "current": 2000.0,
1011
+ "min": 800.0,
1012
+ "max": 3800.0
1013
+ },
1014
+ {
1015
+ "current": 2000.0,
1016
+ "min": 800.0,
1017
+ "max": 3800.0
1018
+ },
1019
+ {
1020
+ "current": 2000.0,
1021
+ "min": 800.0,
1022
+ "max": 3800.0
1023
+ },
1024
+ {
1025
+ "current": 3324.304,
1026
+ "min": 800.0,
1027
+ "max": 3800.0
1028
+ },
1029
+ {
1030
+ "current": 2000.0,
1031
+ "min": 800.0,
1032
+ "max": 3800.0
1033
+ },
1034
+ {
1035
+ "current": 2000.0,
1036
+ "min": 800.0,
1037
+ "max": 3800.0
1038
+ },
1039
+ {
1040
+ "current": 2000.0,
1041
+ "min": 800.0,
1042
+ "max": 3800.0
1043
+ },
1044
+ {
1045
+ "current": 2000.0,
1046
+ "min": 800.0,
1047
+ "max": 3800.0
1048
+ },
1049
+ {
1050
+ "current": 2000.0,
1051
+ "min": 800.0,
1052
+ "max": 3800.0
1053
+ },
1054
+ {
1055
+ "current": 2000.0,
1056
+ "min": 800.0,
1057
+ "max": 3800.0
1058
+ },
1059
+ {
1060
+ "current": 2000.0,
1061
+ "min": 800.0,
1062
+ "max": 3800.0
1063
+ },
1064
+ {
1065
+ "current": 2000.0,
1066
+ "min": 800.0,
1067
+ "max": 3800.0
1068
+ },
1069
+ {
1070
+ "current": 2000.0,
1071
+ "min": 800.0,
1072
+ "max": 3800.0
1073
+ },
1074
+ {
1075
+ "current": 2000.0,
1076
+ "min": 800.0,
1077
+ "max": 3800.0
1078
+ },
1079
+ {
1080
+ "current": 2000.0,
1081
+ "min": 800.0,
1082
+ "max": 3800.0
1083
+ },
1084
+ {
1085
+ "current": 2000.0,
1086
+ "min": 800.0,
1087
+ "max": 3800.0
1088
+ },
1089
+ {
1090
+ "current": 2000.0,
1091
+ "min": 800.0,
1092
+ "max": 3800.0
1093
+ },
1094
+ {
1095
+ "current": 2000.0,
1096
+ "min": 800.0,
1097
+ "max": 3800.0
1098
+ },
1099
+ {
1100
+ "current": 2000.0,
1101
+ "min": 800.0,
1102
+ "max": 3800.0
1103
+ },
1104
+ {
1105
+ "current": 3324.784,
1106
+ "min": 800.0,
1107
+ "max": 3800.0
1108
+ },
1109
+ {
1110
+ "current": 2000.0,
1111
+ "min": 800.0,
1112
+ "max": 3800.0
1113
+ },
1114
+ {
1115
+ "current": 2000.0,
1116
+ "min": 800.0,
1117
+ "max": 3800.0
1118
+ },
1119
+ {
1120
+ "current": 2000.0,
1121
+ "min": 800.0,
1122
+ "max": 3800.0
1123
+ },
1124
+ {
1125
+ "current": 2000.0,
1126
+ "min": 800.0,
1127
+ "max": 3800.0
1128
+ },
1129
+ {
1130
+ "current": 2000.0,
1131
+ "min": 800.0,
1132
+ "max": 3800.0
1133
+ },
1134
+ {
1135
+ "current": 2000.0,
1136
+ "min": 800.0,
1137
+ "max": 3800.0
1138
+ },
1139
+ {
1140
+ "current": 2000.0,
1141
+ "min": 800.0,
1142
+ "max": 3800.0
1143
+ },
1144
+ {
1145
+ "current": 2000.0,
1146
+ "min": 800.0,
1147
+ "max": 3800.0
1148
+ },
1149
+ {
1150
+ "current": 2000.0,
1151
+ "min": 800.0,
1152
+ "max": 3800.0
1153
+ },
1154
+ {
1155
+ "current": 2000.0,
1156
+ "min": 800.0,
1157
+ "max": 3800.0
1158
+ },
1159
+ {
1160
+ "current": 2000.0,
1161
+ "min": 800.0,
1162
+ "max": 3800.0
1163
+ },
1164
+ {
1165
+ "current": 2000.0,
1166
+ "min": 800.0,
1167
+ "max": 3800.0
1168
+ }
1169
+ ],
1170
+ "disk": {
1171
+ "/": {
1172
+ "total": 1758.8549690246582,
1173
+ "used": 114.58099365234375
1174
+ }
1175
+ },
1176
+ "gpu": "NVIDIA H800",
1177
+ "gpu_count": 8,
1178
+ "gpu_devices": [
1179
+ {
1180
+ "name": "NVIDIA H800",
1181
+ "memory_total": 85520809984
1182
+ },
1183
+ {
1184
+ "name": "NVIDIA H800",
1185
+ "memory_total": 85520809984
1186
+ },
1187
+ {
1188
+ "name": "NVIDIA H800",
1189
+ "memory_total": 85520809984
1190
+ },
1191
+ {
1192
+ "name": "NVIDIA H800",
1193
+ "memory_total": 85520809984
1194
+ },
1195
+ {
1196
+ "name": "NVIDIA H800",
1197
+ "memory_total": 85520809984
1198
+ },
1199
+ {
1200
+ "name": "NVIDIA H800",
1201
+ "memory_total": 85520809984
1202
+ },
1203
+ {
1204
+ "name": "NVIDIA H800",
1205
+ "memory_total": 85520809984
1206
+ },
1207
+ {
1208
+ "name": "NVIDIA H800",
1209
+ "memory_total": 85520809984
1210
+ }
1211
+ ],
1212
+ "memory": {
1213
+ "total": 2015.564224243164
1214
+ }
1215
+ }
wandb/run-20240921_050939-9z0w7l09/files/wandb-summary.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"train/step": 148, "train/loss": 0.6364923119544983, "train/reward": -7.709503173828125, "train/better_sample_reward": -2.553741693496704, "train/worse_sample_reward": -5.15576171875, "train/reward_accuracy": 0.75, "train/reward_margin": 2.602020263671875, "train/lr": 8.284550220824186e-07, "train/epoch": 0.8361581920903954, "_timestamp": 1726868060.069517, "_runtime": 1480.246605873108, "_step": 148, "_wandb": {"runtime": 1489}}
wandb/run-20240921_050939-9z0w7l09/logs/debug-internal.log ADDED
The diff for this file is too large to render. See raw diff
 
wandb/run-20240921_050939-9z0w7l09/logs/debug.log ADDED
@@ -0,0 +1,36 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2024-09-21 05:09:39,806 INFO MainThread:730272 [wandb_setup.py:_flush():76] Current SDK version is 0.17.5
2
+ 2024-09-21 05:09:39,806 INFO MainThread:730272 [wandb_setup.py:_flush():76] Configure stats pid to 730272
3
+ 2024-09-21 05:09:39,806 INFO MainThread:730272 [wandb_setup.py:_flush():76] Loading settings from /home/yangyaodong/.config/wandb/settings
4
+ 2024-09-21 05:09:39,806 INFO MainThread:730272 [wandb_setup.py:_flush():76] Loading settings from /aifs4su/yaodong/projects/hantao/dev_cham/align-anything/scripts/wandb/settings
5
+ 2024-09-21 05:09:39,806 INFO MainThread:730272 [wandb_setup.py:_flush():76] Loading settings from environment variables: {'api_key': '***REDACTED***'}
6
+ 2024-09-21 05:09:39,806 INFO MainThread:730272 [wandb_setup.py:_flush():76] Applying setup settings: {'_disable_service': False}
7
+ 2024-09-21 05:09:39,806 WARNING MainThread:730272 [wandb_setup.py:_flush():76] Could not find program at -m align_anything.trainers.tiv_to_t.dpo
8
+ 2024-09-21 05:09:39,806 INFO MainThread:730272 [wandb_setup.py:_flush():76] Inferring run settings from compute environment: {'program_relpath': None, 'program': '-m align_anything.trainers.tiv_to_t.dpo'}
9
+ 2024-09-21 05:09:39,806 INFO MainThread:730272 [wandb_setup.py:_flush():76] Applying login settings: {}
10
+ 2024-09-21 05:09:39,806 INFO MainThread:730272 [wandb_init.py:_log_setup():529] Logging user logs to ../outputs/dpo_tiv2t_1.5k_base/wandb/run-20240921_050939-9z0w7l09/logs/debug.log
11
+ 2024-09-21 05:09:39,807 INFO MainThread:730272 [wandb_init.py:_log_setup():530] Logging internal logs to ../outputs/dpo_tiv2t_1.5k_base/wandb/run-20240921_050939-9z0w7l09/logs/debug-internal.log
12
+ 2024-09-21 05:09:39,807 INFO MainThread:730272 [wandb_init.py:init():569] calling init triggers
13
+ 2024-09-21 05:09:39,807 INFO MainThread:730272 [wandb_init.py:init():576] wandb.init called with sweep_config: {}
14
+ config: {'train_cfgs': {'ds_cfgs': 'ds_z3_config.json', 'epochs': 3, 'seed': 42, 'per_device_train_batch_size': 1.0, 'per_device_eval_batch_size': 1.0, 'gradient_accumulation_steps': 1.0, 'gradient_checkpointing': True, 'learning_rate': 1e-06, 'lr_scheduler_type': 'cosine', 'lr_warmup_ratio': 0.01, 'weight_decay': 0.0, 'adam_betas': [0.9, 0.95], 'bf16': True, 'fp16': False, 'eval_strategy': 'epoch', 'eval_interval': 10, 'regularization': 0.001, 'scale_coeff': 0.1, 'freeze_mm_proj': False, 'freeze_vision_tower': True, 'freeze_language_model': False}, 'data_cfgs': {'train_datasets': '/aifs4su/yaodong/datasets/aaa_dataset/TV2T-preference/extracted', 'train_template': 'NExTQA_preference', 'train_size': None, 'train_split': 'train', 'train_subset': None, 'train_data_files': 'extracted_preference_1.5k_washed.json', 'train_optional_args': [], 'eval_datasets': None, 'eval_template': None, 'eval_size': None, 'eval_split': None, 'eval_subset': None, 'eval_data_files': None, 'eval_optional_args': []}, 'logger_cfgs': {'log_type': 'wandb', 'log_project': 'align-anything', 'log_run_name': 'dpo', 'output_dir': '../outputs/dpo_tiv2t_1.5k_base', 'cache_dir': None, 'save_interval': 100000}, 'model_cfgs': {'model_name_or_path': '/aifs4su/yaodong/models/Qwen2-VL-7B-Instruct', 'trust_remote_code': True, 'model_max_length': 4096}, 'special_tokens': None}
15
+ 2024-09-21 05:09:39,807 INFO MainThread:730272 [wandb_init.py:init():619] starting backend
16
+ 2024-09-21 05:09:39,807 INFO MainThread:730272 [wandb_init.py:init():623] setting up manager
17
+ 2024-09-21 05:09:39,809 INFO MainThread:730272 [backend.py:_multiprocessing_setup():105] multiprocessing start_methods=fork,spawn,forkserver, using: spawn
18
+ 2024-09-21 05:09:39,822 INFO MainThread:730272 [wandb_init.py:init():631] backend started and connected
19
+ 2024-09-21 05:09:39,827 INFO MainThread:730272 [wandb_init.py:init():720] updated telemetry
20
+ 2024-09-21 05:09:39,856 INFO MainThread:730272 [wandb_init.py:init():753] communicating run to backend with 90.0 second timeout
21
+ 2024-09-21 05:09:40,452 INFO MainThread:730272 [wandb_run.py:_on_init():2435] communicating current version
22
+ 2024-09-21 05:09:40,618 INFO MainThread:730272 [wandb_run.py:_on_init():2444] got version response upgrade_message: "wandb version 0.18.1 is available! To upgrade, please run:\n $ pip install wandb --upgrade"
23
+
24
+ 2024-09-21 05:09:40,619 INFO MainThread:730272 [wandb_init.py:init():804] starting run threads in backend
25
+ 2024-09-21 05:09:46,898 INFO MainThread:730272 [wandb_run.py:_console_start():2413] atexit reg
26
+ 2024-09-21 05:09:46,898 INFO MainThread:730272 [wandb_run.py:_redirect():2255] redirect: wrap_raw
27
+ 2024-09-21 05:09:46,898 INFO MainThread:730272 [wandb_run.py:_redirect():2320] Wrapping output streams.
28
+ 2024-09-21 05:09:46,898 INFO MainThread:730272 [wandb_run.py:_redirect():2345] Redirects installed.
29
+ 2024-09-21 05:09:46,902 INFO MainThread:730272 [wandb_init.py:init():847] run started, returning control to user process
30
+ 2024-09-21 05:34:29,563 INFO MainThread:730272 [wandb_run.py:_finish():2107] finishing run htlou/align-anything/9z0w7l09
31
+ 2024-09-21 05:34:29,563 INFO MainThread:730272 [wandb_run.py:_atexit_cleanup():2374] got exitcode: 0
32
+ 2024-09-21 05:34:29,563 INFO MainThread:730272 [wandb_run.py:_restore():2352] restore
33
+ 2024-09-21 05:34:29,564 INFO MainThread:730272 [wandb_run.py:_restore():2358] restore done
34
+ 2024-09-21 05:34:37,880 INFO MainThread:730272 [wandb_run.py:_footer_history_summary_info():4016] rendering history
35
+ 2024-09-21 05:34:37,881 INFO MainThread:730272 [wandb_run.py:_footer_history_summary_info():4048] rendering summary
36
+ 2024-09-21 05:34:37,886 INFO MainThread:730272 [wandb_run.py:_footer_sync_info():3975] logging synced files
wandb/run-20240921_050939-9z0w7l09/run-9z0w7l09.wandb ADDED
Binary file (577 kB). View file
 
wandb/run-20240921_103042-1p62y7m7/files/conda-environment.yaml ADDED
@@ -0,0 +1,516 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ name: hantao_tiv
2
+ channels:
3
+ - nvidia/label/cuda-12.1.0
4
+ - nvidia
5
+ - pytorch
6
+ - huggingface
7
+ - conda-forge
8
+ - defaults
9
+ dependencies:
10
+ - _libgcc_mutex=0.1=conda_forge
11
+ - _openmp_mutex=4.5=2_gnu
12
+ - aom=3.9.1=hac33072_0
13
+ - asttokens=2.4.1=pyhd8ed1ab_0
14
+ - blas=1.0=mkl
15
+ - brotli-python=1.1.0=py311hb755f60_1
16
+ - bzip2=1.0.8=h4bc722e_7
17
+ - ca-certificates=2024.7.4=hbcca054_0
18
+ - cairo=1.18.0=hebfffa5_3
19
+ - certifi=2024.7.4=pyhd8ed1ab_0
20
+ - cffi=1.16.0=py311hb3a22ac_0
21
+ - charset-normalizer=3.3.2=pyhd8ed1ab_0
22
+ - comm=0.2.2=pyhd8ed1ab_0
23
+ - cuda=12.1.0=0
24
+ - cuda-cccl=12.1.55=0
25
+ - cuda-command-line-tools=12.1.0=0
26
+ - cuda-compiler=12.1.0=0
27
+ - cuda-cudart=12.1.55=0
28
+ - cuda-cudart-dev=12.1.55=0
29
+ - cuda-cudart-static=12.1.55=0
30
+ - cuda-cuobjdump=12.1.55=0
31
+ - cuda-cupti=12.1.62=0
32
+ - cuda-cupti-static=12.1.62=0
33
+ - cuda-cuxxfilt=12.1.55=0
34
+ - cuda-demo-suite=12.1.55=0
35
+ - cuda-documentation=12.1.55=0
36
+ - cuda-driver-dev=12.1.55=0
37
+ - cuda-gdb=12.1.55=0
38
+ - cuda-libraries=12.1.0=0
39
+ - cuda-libraries-dev=12.1.0=0
40
+ - cuda-libraries-static=12.1.0=0
41
+ - cuda-nsight=12.1.55=0
42
+ - cuda-nsight-compute=12.1.0=0
43
+ - cuda-nvcc=12.1.66=0
44
+ - cuda-nvdisasm=12.1.55=0
45
+ - cuda-nvml-dev=12.1.55=0
46
+ - cuda-nvprof=12.1.55=0
47
+ - cuda-nvprune=12.1.55=0
48
+ - cuda-nvrtc=12.1.55=0
49
+ - cuda-nvrtc-dev=12.1.55=0
50
+ - cuda-nvrtc-static=12.1.55=0
51
+ - cuda-nvtx=12.1.66=0
52
+ - cuda-nvvp=12.1.55=0
53
+ - cuda-opencl=12.1.56=0
54
+ - cuda-opencl-dev=12.1.56=0
55
+ - cuda-profiler-api=12.1.55=0
56
+ - cuda-runtime=12.1.0=0
57
+ - cuda-sanitizer-api=12.1.55=0
58
+ - cuda-toolkit=12.1.0=0
59
+ - cuda-tools=12.1.0=0
60
+ - cuda-visual-tools=12.1.0=0
61
+ - dav1d=1.2.1=hd590300_0
62
+ - debugpy=1.8.2=py311h4332511_0
63
+ - exceptiongroup=1.2.2=pyhd8ed1ab_0
64
+ - executing=2.0.1=pyhd8ed1ab_0
65
+ - expat=2.6.2=h59595ed_0
66
+ - ffmpeg=7.0.1=gpl_h9be9148_104
67
+ - filelock=3.15.4=pyhd8ed1ab_0
68
+ - font-ttf-dejavu-sans-mono=2.37=hab24e00_0
69
+ - font-ttf-inconsolata=3.000=h77eed37_0
70
+ - font-ttf-source-code-pro=2.038=h77eed37_0
71
+ - font-ttf-ubuntu=0.83=h77eed37_2
72
+ - fontconfig=2.14.2=h14ed4e7_0
73
+ - fonts-conda-ecosystem=1=0
74
+ - fonts-conda-forge=1=0
75
+ - freetype=2.12.1=h267a509_2
76
+ - fribidi=1.0.10=h36c2ea0_0
77
+ - gds-tools=1.6.0.25=0
78
+ - gettext=0.22.5=h59595ed_2
79
+ - gettext-tools=0.22.5=h59595ed_2
80
+ - git-lfs=3.5.1=ha770c72_0
81
+ - gmp=6.3.0=hac33072_2
82
+ - gmpy2=2.1.5=py311hc4f1f91_1
83
+ - gnutls=3.7.9=hb077bed_0
84
+ - graphite2=1.3.13=h59595ed_1003
85
+ - h2=4.1.0=pyhd8ed1ab_0
86
+ - harfbuzz=9.0.0=hda332d3_1
87
+ - hpack=4.0.0=pyh9f0ad1d_0
88
+ - hyperframe=6.0.1=pyhd8ed1ab_0
89
+ - icu=75.1=he02047a_0
90
+ - idna=3.7=pyhd8ed1ab_0
91
+ - importlib-metadata=8.2.0=pyha770c72_0
92
+ - importlib_metadata=8.2.0=hd8ed1ab_0
93
+ - intel-openmp=2022.0.1=h06a4308_3633
94
+ - ipykernel=6.29.5=pyh3099207_0
95
+ - ipython=8.26.0=pyh707e725_0
96
+ - jedi=0.19.1=pyhd8ed1ab_0
97
+ - jinja2=3.1.4=pyhd8ed1ab_0
98
+ - jupyter_client=8.6.2=pyhd8ed1ab_0
99
+ - jupyter_core=5.7.2=py311h38be061_0
100
+ - keyutils=1.6.1=h166bdaf_0
101
+ - krb5=1.21.3=h659f571_0
102
+ - lame=3.100=h166bdaf_1003
103
+ - lcms2=2.16=hb7c19ff_0
104
+ - ld_impl_linux-64=2.40=hf3520f5_7
105
+ - lerc=4.0.0=h27087fc_0
106
+ - libabseil=20240116.2=cxx17_he02047a_1
107
+ - libasprintf=0.22.5=h661eb56_2
108
+ - libasprintf-devel=0.22.5=h661eb56_2
109
+ - libass=0.17.1=h39113c1_2
110
+ - libblas=3.9.0=16_linux64_mkl
111
+ - libcblas=3.9.0=16_linux64_mkl
112
+ - libcublas=12.1.0.26=0
113
+ - libcublas-dev=12.1.0.26=0
114
+ - libcublas-static=12.1.0.26=0
115
+ - libcufft=11.0.2.4=0
116
+ - libcufft-dev=11.0.2.4=0
117
+ - libcufft-static=11.0.2.4=0
118
+ - libcufile=1.6.0.25=0
119
+ - libcufile-dev=1.6.0.25=0
120
+ - libcufile-static=1.6.0.25=0
121
+ - libcurand=10.3.2.56=0
122
+ - libcurand-dev=10.3.2.56=0
123
+ - libcurand-static=10.3.2.56=0
124
+ - libcusolver=11.4.4.55=0
125
+ - libcusolver-dev=11.4.4.55=0
126
+ - libcusolver-static=11.4.4.55=0
127
+ - libcusparse=12.0.2.55=0
128
+ - libcusparse-dev=12.0.2.55=0
129
+ - libcusparse-static=12.0.2.55=0
130
+ - libdeflate=1.20=hd590300_0
131
+ - libdrm=2.4.122=h4ab18f5_0
132
+ - libedit=3.1.20191231=he28a2e2_2
133
+ - libexpat=2.6.2=h59595ed_0
134
+ - libffi=3.4.2=h7f98852_5
135
+ - libgcc-ng=14.1.0=h77fa898_0
136
+ - libgettextpo=0.22.5=h59595ed_2
137
+ - libgettextpo-devel=0.22.5=h59595ed_2
138
+ - libglib=2.80.3=h8a4344b_1
139
+ - libgomp=14.1.0=h77fa898_0
140
+ - libhwloc=2.11.1=default_hecaa2ac_1000
141
+ - libiconv=1.17=hd590300_2
142
+ - libidn2=2.3.7=hd590300_0
143
+ - libjpeg-turbo=3.0.0=hd590300_1
144
+ - liblapack=3.9.0=16_linux64_mkl
145
+ - libnpp=12.0.2.50=0
146
+ - libnpp-dev=12.0.2.50=0
147
+ - libnpp-static=12.0.2.50=0
148
+ - libnsl=2.0.1=hd590300_0
149
+ - libnvjitlink=12.1.105=0
150
+ - libnvjitlink-dev=12.1.55=0
151
+ - libnvjpeg=12.1.0.39=0
152
+ - libnvjpeg-dev=12.1.0.39=0
153
+ - libnvjpeg-static=12.1.0.39=0
154
+ - libnvvm-samples=12.1.55=0
155
+ - libopenvino=2024.2.0=h2da1b83_1
156
+ - libopenvino-auto-batch-plugin=2024.2.0=hb045406_1
157
+ - libopenvino-auto-plugin=2024.2.0=hb045406_1
158
+ - libopenvino-hetero-plugin=2024.2.0=h5c03a75_1
159
+ - libopenvino-intel-cpu-plugin=2024.2.0=h2da1b83_1
160
+ - libopenvino-intel-gpu-plugin=2024.2.0=h2da1b83_1
161
+ - libopenvino-intel-npu-plugin=2024.2.0=he02047a_1
162
+ - libopenvino-ir-frontend=2024.2.0=h5c03a75_1
163
+ - libopenvino-onnx-frontend=2024.2.0=h07e8aee_1
164
+ - libopenvino-paddle-frontend=2024.2.0=h07e8aee_1
165
+ - libopenvino-pytorch-frontend=2024.2.0=he02047a_1
166
+ - libopenvino-tensorflow-frontend=2024.2.0=h39126c6_1
167
+ - libopenvino-tensorflow-lite-frontend=2024.2.0=he02047a_1
168
+ - libopus=1.3.1=h7f98852_1
169
+ - libpciaccess=0.18=hd590300_0
170
+ - libpng=1.6.43=h2797004_0
171
+ - libprotobuf=4.25.3=h08a7969_0
172
+ - libsodium=1.0.18=h36c2ea0_1
173
+ - libsqlite=3.46.0=hde9e2c9_0
174
+ - libstdcxx-ng=14.1.0=hc0a3c3a_0
175
+ - libtasn1=4.19.0=h166bdaf_0
176
+ - libtiff=4.6.0=h1dd3fc0_3
177
+ - libunistring=0.9.10=h7f98852_0
178
+ - libuuid=2.38.1=h0b41bf4_0
179
+ - libva=2.22.0=hb711507_0
180
+ - libvpx=1.14.1=hac33072_0
181
+ - libwebp-base=1.4.0=hd590300_0
182
+ - libxcb=1.16=hd590300_0
183
+ - libxcrypt=4.4.36=hd590300_1
184
+ - libxml2=2.12.7=he7c6b58_4
185
+ - libzlib=1.3.1=h4ab18f5_1
186
+ - llvm-openmp=15.0.7=h0cdce71_0
187
+ - markupsafe=2.1.5=py311h459d7ec_0
188
+ - matplotlib-inline=0.1.7=pyhd8ed1ab_0
189
+ - mkl=2022.1.0=hc2b9512_224
190
+ - mpc=1.3.1=hfe3b2da_0
191
+ - mpfr=4.2.1=h38ae2d0_2
192
+ - mpmath=1.3.0=pyhd8ed1ab_0
193
+ - ncurses=6.5=h59595ed_0
194
+ - nest-asyncio=1.6.0=pyhd8ed1ab_0
195
+ - nettle=3.9.1=h7ab15ed_0
196
+ - networkx=3.3=pyhd8ed1ab_1
197
+ - nsight-compute=2023.1.0.15=0
198
+ - ocl-icd=2.3.2=hd590300_1
199
+ - openh264=2.4.1=h59595ed_0
200
+ - openjpeg=2.5.2=h488ebb8_0
201
+ - openssl=3.3.1=h4bc722e_2
202
+ - p11-kit=0.24.1=hc5aa10d_0
203
+ - packaging=24.1=pyhd8ed1ab_0
204
+ - parso=0.8.4=pyhd8ed1ab_0
205
+ - pcre2=10.44=h0f59acf_0
206
+ - pexpect=4.9.0=pyhd8ed1ab_0
207
+ - pickleshare=0.7.5=py_1003
208
+ - pillow=10.4.0=py311h82a398c_0
209
+ - pip=24.0=pyhd8ed1ab_0
210
+ - pixman=0.43.2=h59595ed_0
211
+ - prompt-toolkit=3.0.47=pyha770c72_0
212
+ - psutil=6.0.0=py311h331c9d8_0
213
+ - pthread-stubs=0.4=h36c2ea0_1001
214
+ - ptyprocess=0.7.0=pyhd3deb0d_0
215
+ - pugixml=1.14=h59595ed_0
216
+ - pure_eval=0.2.3=pyhd8ed1ab_0
217
+ - pycparser=2.22=pyhd8ed1ab_0
218
+ - pygments=2.18.0=pyhd8ed1ab_0
219
+ - pysocks=1.7.1=pyha2e5f31_6
220
+ - python=3.11.9=hb806964_0_cpython
221
+ - python_abi=3.11=4_cp311
222
+ - pytorch=2.4.0=py3.11_cuda12.1_cudnn9.1.0_0
223
+ - pytorch-cuda=12.1=ha16c6d3_5
224
+ - pytorch-mutex=1.0=cuda
225
+ - pyyaml=6.0.1=py311h459d7ec_1
226
+ - pyzmq=26.0.3=py311h08a0b41_0
227
+ - readline=8.2=h8228510_1
228
+ - requests=2.32.3=pyhd8ed1ab_0
229
+ - setuptools=71.0.4=pyhd8ed1ab_0
230
+ - six=1.16.0=pyh6c4a22f_0
231
+ - snappy=1.2.1=ha2e4443_0
232
+ - stack_data=0.6.2=pyhd8ed1ab_0
233
+ - svt-av1=2.1.2=hac33072_0
234
+ - sympy=1.13.0=pypyh2585a3b_103
235
+ - tbb=2021.12.0=h434a139_3
236
+ - tk=8.6.13=noxft_h4845f30_101
237
+ - torchaudio=2.4.0=py311_cu121
238
+ - torchtriton=3.0.0=py311
239
+ - tornado=6.4.1=py311h331c9d8_0
240
+ - traitlets=5.14.3=pyhd8ed1ab_0
241
+ - typing_extensions=4.12.2=pyha770c72_0
242
+ - urllib3=2.2.2=pyhd8ed1ab_1
243
+ - wayland=1.23.0=h5291e77_0
244
+ - wayland-protocols=1.36=hd8ed1ab_0
245
+ - wcwidth=0.2.13=pyhd8ed1ab_0
246
+ - wheel=0.43.0=pyhd8ed1ab_1
247
+ - x264=1!164.3095=h166bdaf_2
248
+ - x265=3.5=h924138e_3
249
+ - xorg-fixesproto=5.0=h7f98852_1002
250
+ - xorg-kbproto=1.0.7=h7f98852_1002
251
+ - xorg-libice=1.1.1=hd590300_0
252
+ - xorg-libsm=1.2.4=h7391055_0
253
+ - xorg-libx11=1.8.9=hb711507_1
254
+ - xorg-libxau=1.0.11=hd590300_0
255
+ - xorg-libxdmcp=1.1.3=h7f98852_0
256
+ - xorg-libxext=1.3.4=h0b41bf4_2
257
+ - xorg-libxfixes=5.0.3=h7f98852_1004
258
+ - xorg-libxrender=0.9.11=hd590300_0
259
+ - xorg-renderproto=0.11.1=h7f98852_1002
260
+ - xorg-xextproto=7.3.0=h0b41bf4_1003
261
+ - xorg-xproto=7.0.31=h7f98852_1007
262
+ - xz=5.2.6=h166bdaf_0
263
+ - yaml=0.2.5=h7f98852_2
264
+ - zeromq=4.3.5=h75354e8_4
265
+ - zipp=3.19.2=pyhd8ed1ab_0
266
+ - zlib=1.3.1=h4ab18f5_1
267
+ - zstandard=0.23.0=py311h5cd10c7_0
268
+ - zstd=1.5.6=ha6fb4c9_0
269
+ - pip:
270
+ - about-time==4.2.1
271
+ - absl-py==2.1.0
272
+ - accelerate==0.34.0
273
+ - aiofiles==23.2.1
274
+ - aiohttp==3.9.5
275
+ - aiohttp-retry==2.8.3
276
+ - aiosignal==1.3.1
277
+ - align-anything==0.0.1.dev0
278
+ - alive-progress==3.1.5
279
+ - amqp==5.2.0
280
+ - annotated-types==0.7.0
281
+ - antlr4-python3-runtime==4.9.3
282
+ - anyio==4.4.0
283
+ - appdirs==1.4.4
284
+ - asyncssh==2.16.0
285
+ - atpublic==5.0
286
+ - attrs==23.2.0
287
+ - audioread==3.0.1
288
+ - backoff==2.2.1
289
+ - billiard==4.2.0
290
+ - boto3==1.35.9
291
+ - botocore==1.35.9
292
+ - cachetools==5.4.0
293
+ - celery==5.4.0
294
+ - cfgv==3.4.0
295
+ - click==8.1.7
296
+ - click-didyoumean==0.3.1
297
+ - click-plugins==1.1.1
298
+ - click-repl==0.3.0
299
+ - cloudpickle==3.0.0
300
+ - cmake==3.30.1
301
+ - colorama==0.4.6
302
+ - commonmark==0.9.1
303
+ - configobj==5.0.8
304
+ - contourpy==1.2.1
305
+ - cryptography==43.0.0
306
+ - cycler==0.12.1
307
+ - dacite==1.6.0
308
+ - dagshub==0.3.35
309
+ - dagshub-annotation-converter==0.1.0
310
+ - dataclasses-json==0.6.7
311
+ - datasets==2.20.0
312
+ - decorator==4.4.2
313
+ - deepspeed==0.14.4
314
+ - dictdiffer==0.9.0
315
+ - diffusers==0.29.2
316
+ - dill==0.3.8
317
+ - diskcache==5.6.3
318
+ - distlib==0.3.8
319
+ - distro==1.9.0
320
+ - dnspython==2.6.1
321
+ - docker-pycreds==0.4.0
322
+ - docstring-parser==0.16
323
+ - dpath==2.2.0
324
+ - dulwich==0.22.1
325
+ - dvc==3.55.1
326
+ - dvc-data==3.16.5
327
+ - dvc-http==2.32.0
328
+ - dvc-objects==5.1.0
329
+ - dvc-render==1.0.2
330
+ - dvc-studio-client==0.21.0
331
+ - dvc-task==0.4.0
332
+ - einops==0.8.0
333
+ - email-validator==2.2.0
334
+ - entrypoints==0.4
335
+ - fastapi==0.111.1
336
+ - fastapi-cli==0.0.4
337
+ - ffmpy==0.3.3
338
+ - fire==0.6.0
339
+ - flatten-dict==0.4.2
340
+ - flufl-lock==8.1.0
341
+ - fonttools==4.53.1
342
+ - frozenlist==1.4.1
343
+ - fsspec==2024.5.0
344
+ - funcy==2.0
345
+ - fusepy==3.0.1
346
+ - gitdb==4.0.11
347
+ - gitpython==3.1.43
348
+ - gql==3.5.0
349
+ - gradio==4.39.0
350
+ - gradio-client==1.1.1
351
+ - gradio-multimodalchatbot==0.0.1
352
+ - grandalf==0.8
353
+ - grapheme==0.6.0
354
+ - graphql-core==3.2.3
355
+ - grpcio==1.65.1
356
+ - gto==1.7.1
357
+ - h11==0.14.0
358
+ - hjson==3.1.0
359
+ - httpcore==1.0.5
360
+ - httptools==0.6.1
361
+ - httpx==0.27.2
362
+ - huggingface-hub==0.24.3
363
+ - hydra-core==1.3.2
364
+ - identify==2.6.0
365
+ - imageio==2.35.1
366
+ - imageio-ffmpeg==0.5.1
367
+ - importlib-resources==6.4.0
368
+ - iniconfig==2.0.0
369
+ - interegular==0.3.3
370
+ - iterative-telemetry==0.0.8
371
+ - jmespath==1.0.1
372
+ - joblib==1.4.2
373
+ - jsonschema==4.23.0
374
+ - jsonschema-specifications==2023.12.1
375
+ - kiwisolver==1.4.5
376
+ - kombu==5.4.0
377
+ - lark==1.1.9
378
+ - lazy-loader==0.4
379
+ - librosa==0.10.2.post1
380
+ - llamafactory==0.8.4.dev0
381
+ - llvmlite==0.43.0
382
+ - lm-format-enforcer==0.10.3
383
+ - lxml==5.3.0
384
+ - markdown==3.6
385
+ - markdown-it-py==3.0.0
386
+ - marshmallow==3.22.0
387
+ - matplotlib==3.9.1
388
+ - mdurl==0.1.2
389
+ - mmsg==0.1.dev14+gbd2b056.d20240803
390
+ - moviepy==1.0.3
391
+ - mpi4py==4.0.0
392
+ - msgpack==1.0.8
393
+ - multidict==6.0.5
394
+ - multiprocess==0.70.16
395
+ - mypy-extensions==1.0.0
396
+ - ninja==1.11.1.1
397
+ - nodeenv==1.9.1
398
+ - numba==0.60.0
399
+ - numpy==1.26.4
400
+ - nvidia-cublas-cu12==12.1.3.1
401
+ - nvidia-cuda-cupti-cu12==12.1.105
402
+ - nvidia-cuda-nvrtc-cu12==12.1.105
403
+ - nvidia-cuda-runtime-cu12==12.1.105
404
+ - nvidia-cudnn-cu12==8.9.2.26
405
+ - nvidia-cufft-cu12==11.0.2.54
406
+ - nvidia-curand-cu12==10.3.2.106
407
+ - nvidia-cusolver-cu12==11.4.5.107
408
+ - nvidia-cusparse-cu12==12.1.0.106
409
+ - nvidia-ml-py==12.535.161
410
+ - nvidia-nccl-cu12==2.20.5
411
+ - nvidia-nvjitlink-cu12==12.5.82
412
+ - nvidia-nvtx-cu12==12.1.105
413
+ - nvitop==1.3.2
414
+ - omegaconf==2.3.0
415
+ - openai==1.37.1
416
+ - optree==0.12.1
417
+ - orjson==3.10.6
418
+ - outlines==0.0.47.dev37+g26e2934
419
+ - pandas==2.2.2
420
+ - pathspec==0.12.1
421
+ - pathvalidate==3.0.0
422
+ - peft==0.12.0
423
+ - platformdirs==3.11.0
424
+ - pluggy==1.5.0
425
+ - pooch==1.8.2
426
+ - pre-commit==3.8.0
427
+ - proglog==0.1.10
428
+ - prometheus-client==0.20.0
429
+ - prometheus-fastapi-instrumentator==7.0.0
430
+ - protobuf==4.25.4
431
+ - py-cpuinfo==9.0.0
432
+ - pyairports==2.1.1
433
+ - pyarrow==17.0.0
434
+ - pyarrow-hotfix==0.6
435
+ - pyav==13.0.0
436
+ - pycountry==24.6.1
437
+ - pydantic==2.8.2
438
+ - pydantic-core==2.20.1
439
+ - pydot==3.0.1
440
+ - pydub==0.25.1
441
+ - pygit2==1.15.1
442
+ - pygtrie==2.5.0
443
+ - pyparsing==3.1.2
444
+ - pytest==8.3.2
445
+ - python-dateutil==2.9.0.post0
446
+ - python-dotenv==1.0.1
447
+ - python-multipart==0.0.9
448
+ - pytz==2024.1
449
+ - ranger-fm==1.9.3
450
+ - ray==2.34.0
451
+ - referencing==0.35.1
452
+ - regex==2024.7.24
453
+ - requests-toolbelt==1.0.0
454
+ - rfc3986==1.5.0
455
+ - rich==13.1.0
456
+ - rpds-py==0.19.1
457
+ - ruamel-yaml==0.18.6
458
+ - ruamel-yaml-clib==0.2.8
459
+ - ruff==0.5.5
460
+ - s3transfer==0.10.2
461
+ - safetensors==0.4.3
462
+ - scikit-learn==1.5.1
463
+ - scipy==1.14.0
464
+ - scmrepo==3.3.7
465
+ - semantic-version==2.10.0
466
+ - semver==3.0.2
467
+ - sentencepiece==0.2.0
468
+ - sentry-sdk==2.11.0
469
+ - setproctitle==1.3.3
470
+ - shellingham==1.5.4
471
+ - shortuuid==1.0.13
472
+ - shtab==1.7.1
473
+ - smmap==5.0.1
474
+ - sniffio==1.3.1
475
+ - soundfile==0.12.1
476
+ - soxr==0.4.0
477
+ - sqltrie==0.11.1
478
+ - sse-starlette==2.1.3
479
+ - starlette==0.37.2
480
+ - tabulate==0.9.0
481
+ - tenacity==8.2.3
482
+ - tensorboard==2.17.0
483
+ - tensorboard-data-server==0.7.2
484
+ - term-image==0.7.2
485
+ - termcolor==2.4.0
486
+ - threadpoolctl==3.5.0
487
+ - tiktoken==0.7.0
488
+ - tokenizers==0.19.1
489
+ - tomlkit==0.12.0
490
+ - torch==2.3.1
491
+ - torchvision==0.18.1
492
+ - tqdm==4.66.4
493
+ - transformers==4.45.0.dev0
494
+ - treelib==1.6.4
495
+ - triton==2.3.1
496
+ - trl==0.9.6
497
+ - typer==0.12.3
498
+ - typing-inspect==0.9.0
499
+ - tyro==0.8.10
500
+ - tzdata==2024.1
501
+ - uvicorn==0.30.3
502
+ - uvloop==0.19.0
503
+ - vine==5.1.0
504
+ - virtualenv==20.26.3
505
+ - vllm==0.5.3.post1
506
+ - vllm-flash-attn==2.5.9.post1
507
+ - voluptuous==0.15.2
508
+ - wandb==0.17.5
509
+ - watchfiles==0.22.0
510
+ - websockets==11.0.3
511
+ - werkzeug==3.0.3
512
+ - xformers==0.0.27
513
+ - xxhash==3.4.1
514
+ - yarl==1.9.4
515
+ - zc-lockfile==3.0.post1
516
+ prefix: /aifs4su/yaodong/miniconda3/envs/hantao_tiv
wandb/run-20240921_103042-1p62y7m7/files/config.yaml ADDED
@@ -0,0 +1,111 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ wandb_version: 1
2
+
3
+ train_cfgs:
4
+ desc: null
5
+ value:
6
+ ds_cfgs: ds_z3_config.json
7
+ epochs: 3
8
+ seed: 42
9
+ per_device_train_batch_size: 1.0
10
+ per_device_eval_batch_size: 1.0
11
+ gradient_accumulation_steps: 1.0
12
+ gradient_checkpointing: true
13
+ learning_rate: 1.0e-06
14
+ lr_scheduler_type: cosine
15
+ lr_warmup_ratio: 0.01
16
+ weight_decay: 0.0
17
+ adam_betas:
18
+ - 0.9
19
+ - 0.95
20
+ bf16: true
21
+ fp16: false
22
+ eval_strategy: epoch
23
+ eval_interval: 10
24
+ regularization: 0.001
25
+ scale_coeff: 0.1
26
+ freeze_mm_proj: false
27
+ freeze_vision_tower: true
28
+ freeze_language_model: false
29
+ data_cfgs:
30
+ desc: null
31
+ value:
32
+ train_datasets: /aifs4su/yaodong/datasets/aaa_dataset/TV2T-preference/extracted
33
+ train_template: NExTQA_preference
34
+ train_size: null
35
+ train_split: train
36
+ train_subset: null
37
+ train_data_files: extracted_preference_1.5k_washed.json
38
+ train_optional_args: []
39
+ eval_datasets: null
40
+ eval_template: null
41
+ eval_size: null
42
+ eval_split: null
43
+ eval_subset: null
44
+ eval_data_files: null
45
+ eval_optional_args: []
46
+ logger_cfgs:
47
+ desc: null
48
+ value:
49
+ log_type: wandb
50
+ log_project: align-anything
51
+ log_run_name: dpo
52
+ output_dir: ../outputs/dpo_tiv2t_1.5k_base
53
+ cache_dir: null
54
+ save_interval: 100000
55
+ model_cfgs:
56
+ desc: null
57
+ value:
58
+ model_name_or_path: /aifs4su/yaodong/models/Qwen2-VL-7B-Instruct
59
+ trust_remote_code: true
60
+ model_max_length: 4096
61
+ special_tokens:
62
+ desc: null
63
+ value: null
64
+ _wandb:
65
+ desc: null
66
+ value:
67
+ python_version: 3.11.9
68
+ cli_version: 0.17.5
69
+ framework: huggingface
70
+ huggingface_version: 4.45.0.dev0
71
+ is_jupyter_run: false
72
+ is_kaggle_kernel: false
73
+ start_time: 1726885842
74
+ t:
75
+ 1:
76
+ - 1
77
+ - 5
78
+ - 11
79
+ - 41
80
+ - 49
81
+ - 51
82
+ - 53
83
+ - 55
84
+ - 71
85
+ - 83
86
+ - 98
87
+ - 105
88
+ 2:
89
+ - 1
90
+ - 5
91
+ - 11
92
+ - 41
93
+ - 49
94
+ - 51
95
+ - 53
96
+ - 55
97
+ - 71
98
+ - 83
99
+ - 98
100
+ - 105
101
+ 3:
102
+ - 13
103
+ - 16
104
+ - 23
105
+ - 61
106
+ 4: 3.11.9
107
+ 5: 0.17.5
108
+ 6: 4.45.0.dev0
109
+ 8:
110
+ - 5
111
+ 13: linux-x86_64
wandb/run-20240921_103042-1p62y7m7/files/output.log ADDED
@@ -0,0 +1,193 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ ***** Running training *****
3
+
4
+ Training 1/3 epoch: 0%| | 0/531 [00:00<?, ?it/s]`use_cache=True` is incompatible with gradient checkpointing. Setting `use_cache=False`...
5
+ /aifs4su/yaodong/miniconda3/envs/hantao_tiv/lib/python3.11/site-packages/torch/utils/checkpoint.py:295: FutureWarning: `torch.cpu.amp.autocast(args...)` is deprecated. Please use `torch.amp.autocast('cpu', args...)` instead.
6
+ with torch.enable_grad(), device_autocast_ctx, torch.cpu.amp.autocast(**ctx.cpu_autocast_kwargs): # type: ignore[attr-defined]
7
+
8
+
9
+
10
+
11
+
12
+
13
+
14
+
15
+ Training 1/3 epoch (loss 2.0371): 2%|██▍ | 9/531 [01:25<1:12:46, 8.36s/it]
16
+
17
+
18
+
19
+
20
+
21
+
22
+
23
+
24
+
25
+
26
+ Training 1/3 epoch (loss 0.9317): 4%|█████ | 19/531 [02:44<1:06:03, 7.74s/it]
27
+
28
+
29
+
30
+
31
+
32
+
33
+
34
+
35
+
36
+
37
+ Training 1/3 epoch (loss 0.9305): 5%|███████▋ | 29/531 [04:14<1:13:48, 8.82s/it]
38
+
39
+
40
+
41
+
42
+
43
+
44
+
45
+
46
+
47
+
48
+ Training 1/3 epoch (loss 0.7844): 7%|██████████▎ | 39/531 [05:45<1:13:24, 8.95s/it]
49
+
50
+
51
+
52
+
53
+
54
+
55
+
56
+
57
+
58
+
59
+ Training 1/3 epoch (loss 1.7453): 9%|█████████████ | 49/531 [07:02<1:01:45, 7.69s/it]
60
+
61
+
62
+
63
+
64
+
65
+
66
+
67
+
68
+
69
+
70
+ Training 1/3 epoch (loss 0.4600): 11%|███████████████▉ | 59/531 [08:27<59:54, 7.62s/it]
71
+
72
+
73
+
74
+
75
+
76
+
77
+
78
+
79
+
80
+
81
+ Training 1/3 epoch (loss 0.6254): 13%|██████████████████▌ | 69/531 [09:39<58:09, 7.55s/it]
82
+
83
+
84
+
85
+
86
+
87
+
88
+
89
+
90
+
91
+
92
+
93
+ Training 1/3 epoch (loss 0.8718): 15%|████████████████████▉ | 79/531 [11:15<1:02:01, 8.23s/it]
94
+
95
+
96
+
97
+
98
+
99
+
100
+
101
+
102
+
103
+
104
+
105
+ Training 1/3 epoch (loss 0.5030): 17%|███████████████████████▉ | 89/531 [12:31<56:52, 7.72s/it]
106
+
107
+
108
+
109
+
110
+
111
+
112
+
113
+
114
+
115
+
116
+ Training 1/3 epoch (loss 0.2948): 19%|██████████████████████████▋ | 99/531 [13:59<55:37, 7.73s/it]
117
+
118
+
119
+
120
+
121
+
122
+
123
+
124
+
125
+
126
+
127
+
128
+ Training 1/3 epoch (loss 0.5259): 21%|█████████████████████████████▏ | 109/531 [15:17<58:12, 8.28s/it]
129
+
130
+
131
+
132
+
133
+
134
+
135
+
136
+
137
+
138
+
139
+
140
+ Training 1/3 epoch (loss 1.0179): 22%|███████████████████████████████▊ | 119/531 [16:38<51:04, 7.44s/it]
141
+
142
+
143
+
144
+
145
+
146
+
147
+
148
+
149
+
150
+
151
+ Training 1/3 epoch (loss 0.2882): 24%|██████████████████████████████████▍ | 129/531 [17:50<51:06, 7.63s/it]
152
+
153
+
154
+
155
+
156
+
157
+
158
+
159
+
160
+
161
+
162
+ Training 1/3 epoch (loss 0.6585): 26%|█████████████████████████████████████▏ | 139/531 [19:02<48:02, 7.35s/it]
163
+
164
+
165
+
166
+
167
+
168
+
169
+
170
+
171
+
172
+
173
+
174
+ Training 1/3 epoch (loss 0.2897): 28%|███████████████████████████████████████▎ | 149/531 [20:27<1:01:00, 9.58s/it]
175
+
176
+
177
+
178
+
179
+
180
+
181
+
182
+
183
+
184
+
185
+
186
+ Training 1/3 epoch (loss 0.6085): 30%|██████████████████████████████████████████▌ | 159/531 [21:59<47:04, 7.59s/it]
187
+
188
+
189
+
190
+
191
+
192
+
193
+
wandb/run-20240921_103042-1p62y7m7/files/requirements.txt ADDED
@@ -0,0 +1,325 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Brotli==1.1.0
2
+ GitPython==3.1.43
3
+ Jinja2==3.1.4
4
+ Markdown==3.6
5
+ MarkupSafe==2.1.5
6
+ PySocks==1.7.1
7
+ PyYAML==6.0.1
8
+ Pygments==2.18.0
9
+ Werkzeug==3.0.3
10
+ about-time==4.2.1
11
+ absl-py==2.1.0
12
+ accelerate==0.34.0
13
+ aiofiles==23.2.1
14
+ aiohttp-retry==2.8.3
15
+ aiohttp==3.9.5
16
+ aiosignal==1.3.1
17
+ align-anything==0.0.1.dev0
18
+ align-anything==0.0.1.dev0
19
+ alive-progress==3.1.5
20
+ amqp==5.2.0
21
+ annotated-types==0.7.0
22
+ antlr4-python3-runtime==4.9.3
23
+ anyio==4.4.0
24
+ appdirs==1.4.4
25
+ asttokens==2.4.1
26
+ asyncssh==2.16.0
27
+ atpublic==5.0
28
+ attrs==23.2.0
29
+ audioread==3.0.1
30
+ autocommand==2.2.2
31
+ backoff==2.2.1
32
+ backports.tarfile==1.2.0
33
+ billiard==4.2.0
34
+ boto3==1.35.9
35
+ botocore==1.35.9
36
+ cachetools==5.4.0
37
+ celery==5.4.0
38
+ certifi==2024.7.4
39
+ cffi==1.16.0
40
+ cfgv==3.4.0
41
+ charset-normalizer==3.3.2
42
+ click-didyoumean==0.3.1
43
+ click-plugins==1.1.1
44
+ click-repl==0.3.0
45
+ click==8.1.7
46
+ cloudpickle==3.0.0
47
+ cmake==3.30.1
48
+ colorama==0.4.6
49
+ comm==0.2.2
50
+ commonmark==0.9.1
51
+ configobj==5.0.8
52
+ contourpy==1.2.1
53
+ cryptography==43.0.0
54
+ cycler==0.12.1
55
+ dacite==1.6.0
56
+ dagshub-annotation-converter==0.1.0
57
+ dagshub==0.3.35
58
+ dataclasses-json==0.6.7
59
+ datasets==2.20.0
60
+ debugpy==1.8.2
61
+ decorator==4.4.2
62
+ deepspeed==0.14.4
63
+ dictdiffer==0.9.0
64
+ diffusers==0.29.2
65
+ dill==0.3.8
66
+ diskcache==5.6.3
67
+ distlib==0.3.8
68
+ distro==1.9.0
69
+ dnspython==2.6.1
70
+ docker-pycreds==0.4.0
71
+ docstring_parser==0.16
72
+ dpath==2.2.0
73
+ dulwich==0.22.1
74
+ dvc-data==3.16.5
75
+ dvc-http==2.32.0
76
+ dvc-objects==5.1.0
77
+ dvc-render==1.0.2
78
+ dvc-studio-client==0.21.0
79
+ dvc-task==0.4.0
80
+ dvc==3.55.1
81
+ einops==0.8.0
82
+ email_validator==2.2.0
83
+ entrypoints==0.4
84
+ exceptiongroup==1.2.2
85
+ executing==2.0.1
86
+ fastapi-cli==0.0.4
87
+ fastapi==0.111.1
88
+ ffmpy==0.3.3
89
+ filelock==3.15.4
90
+ fire==0.6.0
91
+ flatten-dict==0.4.2
92
+ flufl.lock==8.1.0
93
+ fonttools==4.53.1
94
+ frozenlist==1.4.1
95
+ fsspec==2024.5.0
96
+ funcy==2.0
97
+ fusepy==3.0.1
98
+ gitdb==4.0.11
99
+ gmpy2==2.1.5
100
+ gql==3.5.0
101
+ gradio==4.39.0
102
+ gradio_client==1.1.1
103
+ gradio_multimodalchatbot==0.0.1
104
+ grandalf==0.8
105
+ grapheme==0.6.0
106
+ graphql-core==3.2.3
107
+ grpcio==1.65.1
108
+ gto==1.7.1
109
+ h11==0.14.0
110
+ h2==4.1.0
111
+ hjson==3.1.0
112
+ hpack==4.0.0
113
+ httpcore==1.0.5
114
+ httptools==0.6.1
115
+ httpx==0.27.2
116
+ huggingface-hub==0.24.3
117
+ hydra-core==1.3.2
118
+ hyperframe==6.0.1
119
+ identify==2.6.0
120
+ idna==3.7
121
+ imageio-ffmpeg==0.5.1
122
+ imageio==2.35.1
123
+ importlib_metadata==8.0.0
124
+ importlib_metadata==8.2.0
125
+ importlib_resources==6.4.0
126
+ importlib_resources==6.4.0
127
+ inflect==7.3.1
128
+ iniconfig==2.0.0
129
+ interegular==0.3.3
130
+ ipykernel==6.29.5
131
+ ipython==8.26.0
132
+ iterative-telemetry==0.0.8
133
+ jaraco.context==5.3.0
134
+ jaraco.functools==4.0.1
135
+ jaraco.text==3.12.1
136
+ jedi==0.19.1
137
+ jmespath==1.0.1
138
+ joblib==1.4.2
139
+ jsonschema-specifications==2023.12.1
140
+ jsonschema==4.23.0
141
+ jupyter_client==8.6.2
142
+ jupyter_core==5.7.2
143
+ kiwisolver==1.4.5
144
+ kombu==5.4.0
145
+ lark==1.1.9
146
+ lazy_loader==0.4
147
+ librosa==0.10.2.post1
148
+ llamafactory==0.8.4.dev0
149
+ llamafactory==0.8.4.dev0
150
+ llvmlite==0.43.0
151
+ lm-format-enforcer==0.10.3
152
+ lxml==5.3.0
153
+ markdown-it-py==3.0.0
154
+ marshmallow==3.22.0
155
+ matplotlib-inline==0.1.7
156
+ matplotlib==3.9.1
157
+ mdurl==0.1.2
158
+ mmsg==0.1.dev14+gbd2b056.d20240803
159
+ more-itertools==10.3.0
160
+ moviepy==1.0.3
161
+ mpi4py==4.0.0
162
+ mpmath==1.3.0
163
+ msgpack==1.0.8
164
+ multidict==6.0.5
165
+ multiprocess==0.70.16
166
+ mypy-extensions==1.0.0
167
+ nest_asyncio==1.6.0
168
+ networkx==3.3
169
+ ninja==1.11.1.1
170
+ nodeenv==1.9.1
171
+ numba==0.60.0
172
+ numpy==1.26.4
173
+ nvidia-cublas-cu12==12.1.3.1
174
+ nvidia-cuda-cupti-cu12==12.1.105
175
+ nvidia-cuda-nvrtc-cu12==12.1.105
176
+ nvidia-cuda-runtime-cu12==12.1.105
177
+ nvidia-cudnn-cu12==8.9.2.26
178
+ nvidia-cufft-cu12==11.0.2.54
179
+ nvidia-curand-cu12==10.3.2.106
180
+ nvidia-cusolver-cu12==11.4.5.107
181
+ nvidia-cusparse-cu12==12.1.0.106
182
+ nvidia-ml-py==12.535.161
183
+ nvidia-nccl-cu12==2.20.5
184
+ nvidia-nvjitlink-cu12==12.5.82
185
+ nvidia-nvtx-cu12==12.1.105
186
+ nvitop==1.3.2
187
+ omegaconf==2.3.0
188
+ openai==1.37.1
189
+ optree==0.12.1
190
+ ordered-set==4.1.0
191
+ orjson==3.10.6
192
+ outlines==0.0.47.dev37+g26e2934
193
+ packaging==24.1
194
+ packaging==24.1
195
+ pandas==2.2.2
196
+ parso==0.8.4
197
+ pathspec==0.12.1
198
+ pathvalidate==3.0.0
199
+ peft==0.12.0
200
+ pexpect==4.9.0
201
+ pickleshare==0.7.5
202
+ pillow==10.4.0
203
+ pip==24.0
204
+ platformdirs==3.11.0
205
+ platformdirs==4.2.2
206
+ pluggy==1.5.0
207
+ pooch==1.8.2
208
+ pre-commit==3.8.0
209
+ proglog==0.1.10
210
+ prometheus-fastapi-instrumentator==7.0.0
211
+ prometheus_client==0.20.0
212
+ prompt_toolkit==3.0.47
213
+ protobuf==4.25.4
214
+ psutil==6.0.0
215
+ ptyprocess==0.7.0
216
+ pure_eval==0.2.3
217
+ py-cpuinfo==9.0.0
218
+ pyairports==2.1.1
219
+ pyarrow-hotfix==0.6
220
+ pyarrow==17.0.0
221
+ pyav==13.0.0
222
+ pycountry==24.6.1
223
+ pycparser==2.22
224
+ pydantic==2.8.2
225
+ pydantic_core==2.20.1
226
+ pydot==3.0.1
227
+ pydub==0.25.1
228
+ pygit2==1.15.1
229
+ pygtrie==2.5.0
230
+ pyparsing==3.1.2
231
+ pytest==8.3.2
232
+ python-dateutil==2.9.0
233
+ python-dateutil==2.9.0.post0
234
+ python-dotenv==1.0.1
235
+ python-multipart==0.0.9
236
+ pytz==2024.1
237
+ pyzmq==26.0.3
238
+ ranger-fm==1.9.3
239
+ ray==2.34.0
240
+ referencing==0.35.1
241
+ regex==2024.7.24
242
+ requests-toolbelt==1.0.0
243
+ requests==2.32.3
244
+ rfc3986==1.5.0
245
+ rich==13.1.0
246
+ rpds-py==0.19.1
247
+ ruamel.yaml.clib==0.2.8
248
+ ruamel.yaml==0.18.6
249
+ ruff==0.5.5
250
+ s3transfer==0.10.2
251
+ safetensors==0.4.3
252
+ scikit-learn==1.5.1
253
+ scipy==1.14.0
254
+ scmrepo==3.3.7
255
+ semantic-version==2.10.0
256
+ semver==3.0.2
257
+ sentencepiece==0.2.0
258
+ sentry-sdk==2.11.0
259
+ setproctitle==1.3.3
260
+ setuptools==71.0.4
261
+ shellingham==1.5.4
262
+ shortuuid==1.0.13
263
+ shtab==1.7.1
264
+ six==1.16.0
265
+ smmap==5.0.1
266
+ sniffio==1.3.1
267
+ soundfile==0.12.1
268
+ soxr==0.4.0
269
+ sqltrie==0.11.1
270
+ sse-starlette==2.1.3
271
+ stack-data==0.6.2
272
+ starlette==0.37.2
273
+ sympy==1.13.0
274
+ tabulate==0.9.0
275
+ tenacity==8.2.3
276
+ tensorboard-data-server==0.7.2
277
+ tensorboard==2.17.0
278
+ term-image==0.7.2
279
+ termcolor==2.4.0
280
+ threadpoolctl==3.5.0
281
+ tiktoken==0.7.0
282
+ tokenizers==0.19.1
283
+ tomli==2.0.1
284
+ tomlkit==0.12.0
285
+ torch==2.3.1
286
+ torch==2.4.0
287
+ torchaudio==2.4.0
288
+ torchvision==0.18.1
289
+ torchvision==0.19.0
290
+ tornado==6.4.1
291
+ tqdm==4.66.4
292
+ traitlets==5.14.3
293
+ transformers==4.45.0.dev0
294
+ treelib==1.6.4
295
+ triton==2.3.1
296
+ triton==3.0.0
297
+ trl==0.9.6
298
+ typeguard==4.3.0
299
+ typer==0.12.3
300
+ typing-inspect==0.9.0
301
+ typing_extensions==4.12.2
302
+ typing_extensions==4.12.2
303
+ tyro==0.8.10
304
+ tzdata==2024.1
305
+ urllib3==2.2.2
306
+ uvicorn==0.30.3
307
+ uvloop==0.19.0
308
+ vine==5.1.0
309
+ virtualenv==20.26.3
310
+ vllm-flash-attn==2.5.9.post1
311
+ vllm==0.5.3.post1
312
+ voluptuous==0.15.2
313
+ wandb==0.17.5
314
+ watchfiles==0.22.0
315
+ wcwidth==0.2.13
316
+ websockets==11.0.3
317
+ wheel==0.43.0
318
+ wheel==0.43.0
319
+ xformers==0.0.27
320
+ xxhash==3.4.1
321
+ yarl==1.9.4
322
+ zc.lockfile==3.0.post1
323
+ zipp==3.19.2
324
+ zipp==3.19.2
325
+ zstandard==0.23.0
wandb/run-20240921_103042-1p62y7m7/files/wandb-metadata.json ADDED
@@ -0,0 +1,1215 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "os": "Linux-5.15.0-1040-nvidia-x86_64-with-glibc2.35",
3
+ "python": "3.11.9",
4
+ "heartbeatAt": "2024-09-21T02:30:43.242497",
5
+ "startedAt": "2024-09-21T02:30:42.382544",
6
+ "docker": null,
7
+ "cuda": null,
8
+ "args": [
9
+ "--local_rank=0",
10
+ "--model_name_or_path",
11
+ "/aifs4su/yaodong/models/Qwen2-VL-7B-Instruct",
12
+ "--train_datasets",
13
+ "/aifs4su/yaodong/datasets/aaa_dataset/TV2T-preference/extracted",
14
+ "--output_dir",
15
+ "../outputs/dpo_tiv2t_1.5k_base",
16
+ "--train_data_files",
17
+ "extracted_preference_1.5k_washed.json",
18
+ "--train_template",
19
+ "NExTQA_preference",
20
+ "--train_split",
21
+ "train",
22
+ "--per_device_train_batch_size",
23
+ "1",
24
+ "--per_device_eval_batch_size",
25
+ "1",
26
+ "--gradient_accumulation_steps",
27
+ "1"
28
+ ],
29
+ "state": "running",
30
+ "program": "-m align_anything.trainers.tiv_to_t.dpo",
31
+ "codePathLocal": null,
32
+ "git": {
33
+ "remote": "git@github.com-hantao:htlou/align-anything.git",
34
+ "commit": "9eff99b0ee34f7265b8a2e1824650634c898f654"
35
+ },
36
+ "email": "2200017789@stu.pku.edu.cn",
37
+ "root": "/aifs4su/yaodong/projects/hantao/dev_cham/align-anything",
38
+ "host": "dgx-119",
39
+ "username": "yangyaodong",
40
+ "executable": "/aifs4su/yaodong/miniconda3/envs/hantao_tiv/bin/python3.11",
41
+ "cpu_count": 112,
42
+ "cpu_count_logical": 224,
43
+ "cpu_freq": {
44
+ "current": 2064.2638660714288,
45
+ "min": 800.0,
46
+ "max": 3800.0
47
+ },
48
+ "cpu_freq_per_core": [
49
+ {
50
+ "current": 2000.0,
51
+ "min": 800.0,
52
+ "max": 3800.0
53
+ },
54
+ {
55
+ "current": 2000.0,
56
+ "min": 800.0,
57
+ "max": 3800.0
58
+ },
59
+ {
60
+ "current": 2000.0,
61
+ "min": 800.0,
62
+ "max": 3800.0
63
+ },
64
+ {
65
+ "current": 2000.0,
66
+ "min": 800.0,
67
+ "max": 3800.0
68
+ },
69
+ {
70
+ "current": 2000.0,
71
+ "min": 800.0,
72
+ "max": 3800.0
73
+ },
74
+ {
75
+ "current": 2000.0,
76
+ "min": 800.0,
77
+ "max": 3800.0
78
+ },
79
+ {
80
+ "current": 2000.0,
81
+ "min": 800.0,
82
+ "max": 3800.0
83
+ },
84
+ {
85
+ "current": 2000.0,
86
+ "min": 800.0,
87
+ "max": 3800.0
88
+ },
89
+ {
90
+ "current": 2000.0,
91
+ "min": 800.0,
92
+ "max": 3800.0
93
+ },
94
+ {
95
+ "current": 2000.0,
96
+ "min": 800.0,
97
+ "max": 3800.0
98
+ },
99
+ {
100
+ "current": 2000.0,
101
+ "min": 800.0,
102
+ "max": 3800.0
103
+ },
104
+ {
105
+ "current": 2000.0,
106
+ "min": 800.0,
107
+ "max": 3800.0
108
+ },
109
+ {
110
+ "current": 2000.0,
111
+ "min": 800.0,
112
+ "max": 3800.0
113
+ },
114
+ {
115
+ "current": 2000.0,
116
+ "min": 800.0,
117
+ "max": 3800.0
118
+ },
119
+ {
120
+ "current": 2000.0,
121
+ "min": 800.0,
122
+ "max": 3800.0
123
+ },
124
+ {
125
+ "current": 2000.0,
126
+ "min": 800.0,
127
+ "max": 3800.0
128
+ },
129
+ {
130
+ "current": 2000.0,
131
+ "min": 800.0,
132
+ "max": 3800.0
133
+ },
134
+ {
135
+ "current": 2000.0,
136
+ "min": 800.0,
137
+ "max": 3800.0
138
+ },
139
+ {
140
+ "current": 2000.0,
141
+ "min": 800.0,
142
+ "max": 3800.0
143
+ },
144
+ {
145
+ "current": 2000.0,
146
+ "min": 800.0,
147
+ "max": 3800.0
148
+ },
149
+ {
150
+ "current": 2000.0,
151
+ "min": 800.0,
152
+ "max": 3800.0
153
+ },
154
+ {
155
+ "current": 2000.0,
156
+ "min": 800.0,
157
+ "max": 3800.0
158
+ },
159
+ {
160
+ "current": 2000.0,
161
+ "min": 800.0,
162
+ "max": 3800.0
163
+ },
164
+ {
165
+ "current": 2000.0,
166
+ "min": 800.0,
167
+ "max": 3800.0
168
+ },
169
+ {
170
+ "current": 2000.0,
171
+ "min": 800.0,
172
+ "max": 3800.0
173
+ },
174
+ {
175
+ "current": 2000.0,
176
+ "min": 800.0,
177
+ "max": 3800.0
178
+ },
179
+ {
180
+ "current": 2000.0,
181
+ "min": 800.0,
182
+ "max": 3800.0
183
+ },
184
+ {
185
+ "current": 2000.0,
186
+ "min": 800.0,
187
+ "max": 3800.0
188
+ },
189
+ {
190
+ "current": 2000.0,
191
+ "min": 800.0,
192
+ "max": 3800.0
193
+ },
194
+ {
195
+ "current": 2000.0,
196
+ "min": 800.0,
197
+ "max": 3800.0
198
+ },
199
+ {
200
+ "current": 2000.0,
201
+ "min": 800.0,
202
+ "max": 3800.0
203
+ },
204
+ {
205
+ "current": 2000.0,
206
+ "min": 800.0,
207
+ "max": 3800.0
208
+ },
209
+ {
210
+ "current": 2000.0,
211
+ "min": 800.0,
212
+ "max": 3800.0
213
+ },
214
+ {
215
+ "current": 2000.0,
216
+ "min": 800.0,
217
+ "max": 3800.0
218
+ },
219
+ {
220
+ "current": 2000.0,
221
+ "min": 800.0,
222
+ "max": 3800.0
223
+ },
224
+ {
225
+ "current": 2000.0,
226
+ "min": 800.0,
227
+ "max": 3800.0
228
+ },
229
+ {
230
+ "current": 2000.0,
231
+ "min": 800.0,
232
+ "max": 3800.0
233
+ },
234
+ {
235
+ "current": 2000.0,
236
+ "min": 800.0,
237
+ "max": 3800.0
238
+ },
239
+ {
240
+ "current": 2000.0,
241
+ "min": 800.0,
242
+ "max": 3800.0
243
+ },
244
+ {
245
+ "current": 2000.0,
246
+ "min": 800.0,
247
+ "max": 3800.0
248
+ },
249
+ {
250
+ "current": 2000.0,
251
+ "min": 800.0,
252
+ "max": 3800.0
253
+ },
254
+ {
255
+ "current": 2000.0,
256
+ "min": 800.0,
257
+ "max": 3800.0
258
+ },
259
+ {
260
+ "current": 2000.0,
261
+ "min": 800.0,
262
+ "max": 3800.0
263
+ },
264
+ {
265
+ "current": 2000.0,
266
+ "min": 800.0,
267
+ "max": 3800.0
268
+ },
269
+ {
270
+ "current": 2000.0,
271
+ "min": 800.0,
272
+ "max": 3800.0
273
+ },
274
+ {
275
+ "current": 2000.0,
276
+ "min": 800.0,
277
+ "max": 3800.0
278
+ },
279
+ {
280
+ "current": 2000.0,
281
+ "min": 800.0,
282
+ "max": 3800.0
283
+ },
284
+ {
285
+ "current": 2000.0,
286
+ "min": 800.0,
287
+ "max": 3800.0
288
+ },
289
+ {
290
+ "current": 2000.0,
291
+ "min": 800.0,
292
+ "max": 3800.0
293
+ },
294
+ {
295
+ "current": 2000.0,
296
+ "min": 800.0,
297
+ "max": 3800.0
298
+ },
299
+ {
300
+ "current": 2000.0,
301
+ "min": 800.0,
302
+ "max": 3800.0
303
+ },
304
+ {
305
+ "current": 2000.0,
306
+ "min": 800.0,
307
+ "max": 3800.0
308
+ },
309
+ {
310
+ "current": 2000.0,
311
+ "min": 800.0,
312
+ "max": 3800.0
313
+ },
314
+ {
315
+ "current": 2000.0,
316
+ "min": 800.0,
317
+ "max": 3800.0
318
+ },
319
+ {
320
+ "current": 2000.0,
321
+ "min": 800.0,
322
+ "max": 3800.0
323
+ },
324
+ {
325
+ "current": 2000.0,
326
+ "min": 800.0,
327
+ "max": 3800.0
328
+ },
329
+ {
330
+ "current": 2000.0,
331
+ "min": 800.0,
332
+ "max": 3800.0
333
+ },
334
+ {
335
+ "current": 2000.0,
336
+ "min": 800.0,
337
+ "max": 3800.0
338
+ },
339
+ {
340
+ "current": 2000.0,
341
+ "min": 800.0,
342
+ "max": 3800.0
343
+ },
344
+ {
345
+ "current": 3800.003,
346
+ "min": 800.0,
347
+ "max": 3800.0
348
+ },
349
+ {
350
+ "current": 3800.003,
351
+ "min": 800.0,
352
+ "max": 3800.0
353
+ },
354
+ {
355
+ "current": 3800.0,
356
+ "min": 800.0,
357
+ "max": 3800.0
358
+ },
359
+ {
360
+ "current": 3800.0,
361
+ "min": 800.0,
362
+ "max": 3800.0
363
+ },
364
+ {
365
+ "current": 3800.0,
366
+ "min": 800.0,
367
+ "max": 3800.0
368
+ },
369
+ {
370
+ "current": 2000.0,
371
+ "min": 800.0,
372
+ "max": 3800.0
373
+ },
374
+ {
375
+ "current": 2000.0,
376
+ "min": 800.0,
377
+ "max": 3800.0
378
+ },
379
+ {
380
+ "current": 2000.0,
381
+ "min": 800.0,
382
+ "max": 3800.0
383
+ },
384
+ {
385
+ "current": 2000.0,
386
+ "min": 800.0,
387
+ "max": 3800.0
388
+ },
389
+ {
390
+ "current": 2000.0,
391
+ "min": 800.0,
392
+ "max": 3800.0
393
+ },
394
+ {
395
+ "current": 2000.0,
396
+ "min": 800.0,
397
+ "max": 3800.0
398
+ },
399
+ {
400
+ "current": 2000.0,
401
+ "min": 800.0,
402
+ "max": 3800.0
403
+ },
404
+ {
405
+ "current": 2000.0,
406
+ "min": 800.0,
407
+ "max": 3800.0
408
+ },
409
+ {
410
+ "current": 2000.0,
411
+ "min": 800.0,
412
+ "max": 3800.0
413
+ },
414
+ {
415
+ "current": 2000.0,
416
+ "min": 800.0,
417
+ "max": 3800.0
418
+ },
419
+ {
420
+ "current": 2000.0,
421
+ "min": 800.0,
422
+ "max": 3800.0
423
+ },
424
+ {
425
+ "current": 2000.0,
426
+ "min": 800.0,
427
+ "max": 3800.0
428
+ },
429
+ {
430
+ "current": 2000.0,
431
+ "min": 800.0,
432
+ "max": 3800.0
433
+ },
434
+ {
435
+ "current": 2000.0,
436
+ "min": 800.0,
437
+ "max": 3800.0
438
+ },
439
+ {
440
+ "current": 2000.0,
441
+ "min": 800.0,
442
+ "max": 3800.0
443
+ },
444
+ {
445
+ "current": 2000.0,
446
+ "min": 800.0,
447
+ "max": 3800.0
448
+ },
449
+ {
450
+ "current": 2000.0,
451
+ "min": 800.0,
452
+ "max": 3800.0
453
+ },
454
+ {
455
+ "current": 2000.0,
456
+ "min": 800.0,
457
+ "max": 3800.0
458
+ },
459
+ {
460
+ "current": 2000.0,
461
+ "min": 800.0,
462
+ "max": 3800.0
463
+ },
464
+ {
465
+ "current": 2000.0,
466
+ "min": 800.0,
467
+ "max": 3800.0
468
+ },
469
+ {
470
+ "current": 2000.0,
471
+ "min": 800.0,
472
+ "max": 3800.0
473
+ },
474
+ {
475
+ "current": 2000.0,
476
+ "min": 800.0,
477
+ "max": 3800.0
478
+ },
479
+ {
480
+ "current": 2000.0,
481
+ "min": 800.0,
482
+ "max": 3800.0
483
+ },
484
+ {
485
+ "current": 2000.0,
486
+ "min": 800.0,
487
+ "max": 3800.0
488
+ },
489
+ {
490
+ "current": 2000.0,
491
+ "min": 800.0,
492
+ "max": 3800.0
493
+ },
494
+ {
495
+ "current": 2000.0,
496
+ "min": 800.0,
497
+ "max": 3800.0
498
+ },
499
+ {
500
+ "current": 2000.0,
501
+ "min": 800.0,
502
+ "max": 3800.0
503
+ },
504
+ {
505
+ "current": 2000.0,
506
+ "min": 800.0,
507
+ "max": 3800.0
508
+ },
509
+ {
510
+ "current": 2000.0,
511
+ "min": 800.0,
512
+ "max": 3800.0
513
+ },
514
+ {
515
+ "current": 2000.0,
516
+ "min": 800.0,
517
+ "max": 3800.0
518
+ },
519
+ {
520
+ "current": 2000.0,
521
+ "min": 800.0,
522
+ "max": 3800.0
523
+ },
524
+ {
525
+ "current": 2000.0,
526
+ "min": 800.0,
527
+ "max": 3800.0
528
+ },
529
+ {
530
+ "current": 2000.0,
531
+ "min": 800.0,
532
+ "max": 3800.0
533
+ },
534
+ {
535
+ "current": 2000.0,
536
+ "min": 800.0,
537
+ "max": 3800.0
538
+ },
539
+ {
540
+ "current": 2000.0,
541
+ "min": 800.0,
542
+ "max": 3800.0
543
+ },
544
+ {
545
+ "current": 2000.0,
546
+ "min": 800.0,
547
+ "max": 3800.0
548
+ },
549
+ {
550
+ "current": 2000.0,
551
+ "min": 800.0,
552
+ "max": 3800.0
553
+ },
554
+ {
555
+ "current": 2000.0,
556
+ "min": 800.0,
557
+ "max": 3800.0
558
+ },
559
+ {
560
+ "current": 2000.0,
561
+ "min": 800.0,
562
+ "max": 3800.0
563
+ },
564
+ {
565
+ "current": 2000.0,
566
+ "min": 800.0,
567
+ "max": 3800.0
568
+ },
569
+ {
570
+ "current": 2000.0,
571
+ "min": 800.0,
572
+ "max": 3800.0
573
+ },
574
+ {
575
+ "current": 2000.0,
576
+ "min": 800.0,
577
+ "max": 3800.0
578
+ },
579
+ {
580
+ "current": 3800.0,
581
+ "min": 800.0,
582
+ "max": 3800.0
583
+ },
584
+ {
585
+ "current": 2000.0,
586
+ "min": 800.0,
587
+ "max": 3800.0
588
+ },
589
+ {
590
+ "current": 2000.0,
591
+ "min": 800.0,
592
+ "max": 3800.0
593
+ },
594
+ {
595
+ "current": 2000.0,
596
+ "min": 800.0,
597
+ "max": 3800.0
598
+ },
599
+ {
600
+ "current": 2000.0,
601
+ "min": 800.0,
602
+ "max": 3800.0
603
+ },
604
+ {
605
+ "current": 2000.0,
606
+ "min": 800.0,
607
+ "max": 3800.0
608
+ },
609
+ {
610
+ "current": 2000.0,
611
+ "min": 800.0,
612
+ "max": 3800.0
613
+ },
614
+ {
615
+ "current": 2000.0,
616
+ "min": 800.0,
617
+ "max": 3800.0
618
+ },
619
+ {
620
+ "current": 2000.0,
621
+ "min": 800.0,
622
+ "max": 3800.0
623
+ },
624
+ {
625
+ "current": 2000.0,
626
+ "min": 800.0,
627
+ "max": 3800.0
628
+ },
629
+ {
630
+ "current": 2000.0,
631
+ "min": 800.0,
632
+ "max": 3800.0
633
+ },
634
+ {
635
+ "current": 2000.0,
636
+ "min": 800.0,
637
+ "max": 3800.0
638
+ },
639
+ {
640
+ "current": 2000.0,
641
+ "min": 800.0,
642
+ "max": 3800.0
643
+ },
644
+ {
645
+ "current": 2000.0,
646
+ "min": 800.0,
647
+ "max": 3800.0
648
+ },
649
+ {
650
+ "current": 2000.0,
651
+ "min": 800.0,
652
+ "max": 3800.0
653
+ },
654
+ {
655
+ "current": 3799.772,
656
+ "min": 800.0,
657
+ "max": 3800.0
658
+ },
659
+ {
660
+ "current": 2000.0,
661
+ "min": 800.0,
662
+ "max": 3800.0
663
+ },
664
+ {
665
+ "current": 2000.0,
666
+ "min": 800.0,
667
+ "max": 3800.0
668
+ },
669
+ {
670
+ "current": 2000.0,
671
+ "min": 800.0,
672
+ "max": 3800.0
673
+ },
674
+ {
675
+ "current": 2000.0,
676
+ "min": 800.0,
677
+ "max": 3800.0
678
+ },
679
+ {
680
+ "current": 2000.0,
681
+ "min": 800.0,
682
+ "max": 3800.0
683
+ },
684
+ {
685
+ "current": 2000.0,
686
+ "min": 800.0,
687
+ "max": 3800.0
688
+ },
689
+ {
690
+ "current": 3799.406,
691
+ "min": 800.0,
692
+ "max": 3800.0
693
+ },
694
+ {
695
+ "current": 2000.0,
696
+ "min": 800.0,
697
+ "max": 3800.0
698
+ },
699
+ {
700
+ "current": 2000.0,
701
+ "min": 800.0,
702
+ "max": 3800.0
703
+ },
704
+ {
705
+ "current": 2000.0,
706
+ "min": 800.0,
707
+ "max": 3800.0
708
+ },
709
+ {
710
+ "current": 2000.0,
711
+ "min": 800.0,
712
+ "max": 3800.0
713
+ },
714
+ {
715
+ "current": 2000.0,
716
+ "min": 800.0,
717
+ "max": 3800.0
718
+ },
719
+ {
720
+ "current": 2000.0,
721
+ "min": 800.0,
722
+ "max": 3800.0
723
+ },
724
+ {
725
+ "current": 2000.0,
726
+ "min": 800.0,
727
+ "max": 3800.0
728
+ },
729
+ {
730
+ "current": 2000.0,
731
+ "min": 800.0,
732
+ "max": 3800.0
733
+ },
734
+ {
735
+ "current": 2000.0,
736
+ "min": 800.0,
737
+ "max": 3800.0
738
+ },
739
+ {
740
+ "current": 2000.0,
741
+ "min": 800.0,
742
+ "max": 3800.0
743
+ },
744
+ {
745
+ "current": 2000.0,
746
+ "min": 800.0,
747
+ "max": 3800.0
748
+ },
749
+ {
750
+ "current": 2000.0,
751
+ "min": 800.0,
752
+ "max": 3800.0
753
+ },
754
+ {
755
+ "current": 2000.0,
756
+ "min": 800.0,
757
+ "max": 3800.0
758
+ },
759
+ {
760
+ "current": 2000.0,
761
+ "min": 800.0,
762
+ "max": 3800.0
763
+ },
764
+ {
765
+ "current": 2000.0,
766
+ "min": 800.0,
767
+ "max": 3800.0
768
+ },
769
+ {
770
+ "current": 2000.0,
771
+ "min": 800.0,
772
+ "max": 3800.0
773
+ },
774
+ {
775
+ "current": 2000.0,
776
+ "min": 800.0,
777
+ "max": 3800.0
778
+ },
779
+ {
780
+ "current": 2000.0,
781
+ "min": 800.0,
782
+ "max": 3800.0
783
+ },
784
+ {
785
+ "current": 2000.0,
786
+ "min": 800.0,
787
+ "max": 3800.0
788
+ },
789
+ {
790
+ "current": 2000.0,
791
+ "min": 800.0,
792
+ "max": 3800.0
793
+ },
794
+ {
795
+ "current": 2000.0,
796
+ "min": 800.0,
797
+ "max": 3800.0
798
+ },
799
+ {
800
+ "current": 2000.0,
801
+ "min": 800.0,
802
+ "max": 3800.0
803
+ },
804
+ {
805
+ "current": 2000.0,
806
+ "min": 800.0,
807
+ "max": 3800.0
808
+ },
809
+ {
810
+ "current": 2000.0,
811
+ "min": 800.0,
812
+ "max": 3800.0
813
+ },
814
+ {
815
+ "current": 2000.0,
816
+ "min": 800.0,
817
+ "max": 3800.0
818
+ },
819
+ {
820
+ "current": 2000.0,
821
+ "min": 800.0,
822
+ "max": 3800.0
823
+ },
824
+ {
825
+ "current": 2000.0,
826
+ "min": 800.0,
827
+ "max": 3800.0
828
+ },
829
+ {
830
+ "current": 2000.0,
831
+ "min": 800.0,
832
+ "max": 3800.0
833
+ },
834
+ {
835
+ "current": 2000.0,
836
+ "min": 800.0,
837
+ "max": 3800.0
838
+ },
839
+ {
840
+ "current": 2000.0,
841
+ "min": 800.0,
842
+ "max": 3800.0
843
+ },
844
+ {
845
+ "current": 2000.0,
846
+ "min": 800.0,
847
+ "max": 3800.0
848
+ },
849
+ {
850
+ "current": 2000.0,
851
+ "min": 800.0,
852
+ "max": 3800.0
853
+ },
854
+ {
855
+ "current": 2000.0,
856
+ "min": 800.0,
857
+ "max": 3800.0
858
+ },
859
+ {
860
+ "current": 2000.0,
861
+ "min": 800.0,
862
+ "max": 3800.0
863
+ },
864
+ {
865
+ "current": 2000.0,
866
+ "min": 800.0,
867
+ "max": 3800.0
868
+ },
869
+ {
870
+ "current": 2000.0,
871
+ "min": 800.0,
872
+ "max": 3800.0
873
+ },
874
+ {
875
+ "current": 2000.0,
876
+ "min": 800.0,
877
+ "max": 3800.0
878
+ },
879
+ {
880
+ "current": 2000.0,
881
+ "min": 800.0,
882
+ "max": 3800.0
883
+ },
884
+ {
885
+ "current": 2000.0,
886
+ "min": 800.0,
887
+ "max": 3800.0
888
+ },
889
+ {
890
+ "current": 2000.0,
891
+ "min": 800.0,
892
+ "max": 3800.0
893
+ },
894
+ {
895
+ "current": 2000.0,
896
+ "min": 800.0,
897
+ "max": 3800.0
898
+ },
899
+ {
900
+ "current": 2000.0,
901
+ "min": 800.0,
902
+ "max": 3800.0
903
+ },
904
+ {
905
+ "current": 2000.0,
906
+ "min": 800.0,
907
+ "max": 3800.0
908
+ },
909
+ {
910
+ "current": 2000.0,
911
+ "min": 800.0,
912
+ "max": 3800.0
913
+ },
914
+ {
915
+ "current": 2000.0,
916
+ "min": 800.0,
917
+ "max": 3800.0
918
+ },
919
+ {
920
+ "current": 2000.0,
921
+ "min": 800.0,
922
+ "max": 3800.0
923
+ },
924
+ {
925
+ "current": 2000.0,
926
+ "min": 800.0,
927
+ "max": 3800.0
928
+ },
929
+ {
930
+ "current": 2000.0,
931
+ "min": 800.0,
932
+ "max": 3800.0
933
+ },
934
+ {
935
+ "current": 2000.0,
936
+ "min": 800.0,
937
+ "max": 3800.0
938
+ },
939
+ {
940
+ "current": 2000.0,
941
+ "min": 800.0,
942
+ "max": 3800.0
943
+ },
944
+ {
945
+ "current": 2000.0,
946
+ "min": 800.0,
947
+ "max": 3800.0
948
+ },
949
+ {
950
+ "current": 2000.0,
951
+ "min": 800.0,
952
+ "max": 3800.0
953
+ },
954
+ {
955
+ "current": 2000.0,
956
+ "min": 800.0,
957
+ "max": 3800.0
958
+ },
959
+ {
960
+ "current": 3800.0,
961
+ "min": 800.0,
962
+ "max": 3800.0
963
+ },
964
+ {
965
+ "current": 2000.0,
966
+ "min": 800.0,
967
+ "max": 3800.0
968
+ },
969
+ {
970
+ "current": 2000.0,
971
+ "min": 800.0,
972
+ "max": 3800.0
973
+ },
974
+ {
975
+ "current": 2000.0,
976
+ "min": 800.0,
977
+ "max": 3800.0
978
+ },
979
+ {
980
+ "current": 2000.0,
981
+ "min": 800.0,
982
+ "max": 3800.0
983
+ },
984
+ {
985
+ "current": 2000.0,
986
+ "min": 800.0,
987
+ "max": 3800.0
988
+ },
989
+ {
990
+ "current": 2000.0,
991
+ "min": 800.0,
992
+ "max": 3800.0
993
+ },
994
+ {
995
+ "current": 2000.0,
996
+ "min": 800.0,
997
+ "max": 3800.0
998
+ },
999
+ {
1000
+ "current": 2000.0,
1001
+ "min": 800.0,
1002
+ "max": 3800.0
1003
+ },
1004
+ {
1005
+ "current": 2000.0,
1006
+ "min": 800.0,
1007
+ "max": 3800.0
1008
+ },
1009
+ {
1010
+ "current": 2000.0,
1011
+ "min": 800.0,
1012
+ "max": 3800.0
1013
+ },
1014
+ {
1015
+ "current": 2000.0,
1016
+ "min": 800.0,
1017
+ "max": 3800.0
1018
+ },
1019
+ {
1020
+ "current": 2000.0,
1021
+ "min": 800.0,
1022
+ "max": 3800.0
1023
+ },
1024
+ {
1025
+ "current": 2000.0,
1026
+ "min": 800.0,
1027
+ "max": 3800.0
1028
+ },
1029
+ {
1030
+ "current": 2000.0,
1031
+ "min": 800.0,
1032
+ "max": 3800.0
1033
+ },
1034
+ {
1035
+ "current": 2000.0,
1036
+ "min": 800.0,
1037
+ "max": 3800.0
1038
+ },
1039
+ {
1040
+ "current": 2000.0,
1041
+ "min": 800.0,
1042
+ "max": 3800.0
1043
+ },
1044
+ {
1045
+ "current": 2000.0,
1046
+ "min": 800.0,
1047
+ "max": 3800.0
1048
+ },
1049
+ {
1050
+ "current": 2000.0,
1051
+ "min": 800.0,
1052
+ "max": 3800.0
1053
+ },
1054
+ {
1055
+ "current": 2000.0,
1056
+ "min": 800.0,
1057
+ "max": 3800.0
1058
+ },
1059
+ {
1060
+ "current": 2000.0,
1061
+ "min": 800.0,
1062
+ "max": 3800.0
1063
+ },
1064
+ {
1065
+ "current": 2000.0,
1066
+ "min": 800.0,
1067
+ "max": 3800.0
1068
+ },
1069
+ {
1070
+ "current": 2000.0,
1071
+ "min": 800.0,
1072
+ "max": 3800.0
1073
+ },
1074
+ {
1075
+ "current": 2000.0,
1076
+ "min": 800.0,
1077
+ "max": 3800.0
1078
+ },
1079
+ {
1080
+ "current": 2000.0,
1081
+ "min": 800.0,
1082
+ "max": 3800.0
1083
+ },
1084
+ {
1085
+ "current": 2000.0,
1086
+ "min": 800.0,
1087
+ "max": 3800.0
1088
+ },
1089
+ {
1090
+ "current": 2000.0,
1091
+ "min": 800.0,
1092
+ "max": 3800.0
1093
+ },
1094
+ {
1095
+ "current": 2000.0,
1096
+ "min": 800.0,
1097
+ "max": 3800.0
1098
+ },
1099
+ {
1100
+ "current": 2000.0,
1101
+ "min": 800.0,
1102
+ "max": 3800.0
1103
+ },
1104
+ {
1105
+ "current": 2000.0,
1106
+ "min": 800.0,
1107
+ "max": 3800.0
1108
+ },
1109
+ {
1110
+ "current": 2000.0,
1111
+ "min": 800.0,
1112
+ "max": 3800.0
1113
+ },
1114
+ {
1115
+ "current": 2000.0,
1116
+ "min": 800.0,
1117
+ "max": 3800.0
1118
+ },
1119
+ {
1120
+ "current": 2000.0,
1121
+ "min": 800.0,
1122
+ "max": 3800.0
1123
+ },
1124
+ {
1125
+ "current": 2000.0,
1126
+ "min": 800.0,
1127
+ "max": 3800.0
1128
+ },
1129
+ {
1130
+ "current": 2000.0,
1131
+ "min": 800.0,
1132
+ "max": 3800.0
1133
+ },
1134
+ {
1135
+ "current": 2000.0,
1136
+ "min": 800.0,
1137
+ "max": 3800.0
1138
+ },
1139
+ {
1140
+ "current": 2000.0,
1141
+ "min": 800.0,
1142
+ "max": 3800.0
1143
+ },
1144
+ {
1145
+ "current": 2000.0,
1146
+ "min": 800.0,
1147
+ "max": 3800.0
1148
+ },
1149
+ {
1150
+ "current": 2000.0,
1151
+ "min": 800.0,
1152
+ "max": 3800.0
1153
+ },
1154
+ {
1155
+ "current": 2000.0,
1156
+ "min": 800.0,
1157
+ "max": 3800.0
1158
+ },
1159
+ {
1160
+ "current": 2000.0,
1161
+ "min": 800.0,
1162
+ "max": 3800.0
1163
+ },
1164
+ {
1165
+ "current": 2000.0,
1166
+ "min": 800.0,
1167
+ "max": 3800.0
1168
+ }
1169
+ ],
1170
+ "disk": {
1171
+ "/": {
1172
+ "total": 1758.8549690246582,
1173
+ "used": 14.71224594116211
1174
+ }
1175
+ },
1176
+ "gpu": "NVIDIA H800",
1177
+ "gpu_count": 8,
1178
+ "gpu_devices": [
1179
+ {
1180
+ "name": "NVIDIA H800",
1181
+ "memory_total": 85520809984
1182
+ },
1183
+ {
1184
+ "name": "NVIDIA H800",
1185
+ "memory_total": 85520809984
1186
+ },
1187
+ {
1188
+ "name": "NVIDIA H800",
1189
+ "memory_total": 85520809984
1190
+ },
1191
+ {
1192
+ "name": "NVIDIA H800",
1193
+ "memory_total": 85520809984
1194
+ },
1195
+ {
1196
+ "name": "NVIDIA H800",
1197
+ "memory_total": 85520809984
1198
+ },
1199
+ {
1200
+ "name": "NVIDIA H800",
1201
+ "memory_total": 85520809984
1202
+ },
1203
+ {
1204
+ "name": "NVIDIA H800",
1205
+ "memory_total": 85520809984
1206
+ },
1207
+ {
1208
+ "name": "NVIDIA H800",
1209
+ "memory_total": 85520809984
1210
+ }
1211
+ ],
1212
+ "memory": {
1213
+ "total": 2015.5641632080078
1214
+ }
1215
+ }
wandb/run-20240921_103042-1p62y7m7/files/wandb-summary.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"train/step": 166, "train/loss": 2.7490217685699463, "train/reward": -0.8869644403457642, "train/better_sample_reward": -0.6029175519943237, "train/worse_sample_reward": -0.2840469181537628, "train/reward_accuracy": 0.5, "train/reward_margin": -0.3188706040382385, "train/lr": 7.861083133307247e-07, "train/epoch": 0.9378531073446328, "_timestamp": 1726887218.607224, "_runtime": 1376.2130439281464, "_step": 166}
wandb/run-20240921_103042-1p62y7m7/logs/debug-internal.log ADDED
The diff for this file is too large to render. See raw diff
 
wandb/run-20240921_103042-1p62y7m7/logs/debug.log ADDED
@@ -0,0 +1,29 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2024-09-21 10:30:42,388 INFO MainThread:2677650 [wandb_setup.py:_flush():76] Current SDK version is 0.17.5
2
+ 2024-09-21 10:30:42,389 INFO MainThread:2677650 [wandb_setup.py:_flush():76] Configure stats pid to 2677650
3
+ 2024-09-21 10:30:42,389 INFO MainThread:2677650 [wandb_setup.py:_flush():76] Loading settings from /home/yangyaodong/.config/wandb/settings
4
+ 2024-09-21 10:30:42,389 INFO MainThread:2677650 [wandb_setup.py:_flush():76] Loading settings from /aifs4su/yaodong/projects/hantao/dev_cham/align-anything/scripts/wandb/settings
5
+ 2024-09-21 10:30:42,389 INFO MainThread:2677650 [wandb_setup.py:_flush():76] Loading settings from environment variables: {'api_key': '***REDACTED***'}
6
+ 2024-09-21 10:30:42,389 INFO MainThread:2677650 [wandb_setup.py:_flush():76] Applying setup settings: {'_disable_service': False}
7
+ 2024-09-21 10:30:42,389 WARNING MainThread:2677650 [wandb_setup.py:_flush():76] Could not find program at -m align_anything.trainers.tiv_to_t.dpo
8
+ 2024-09-21 10:30:42,389 INFO MainThread:2677650 [wandb_setup.py:_flush():76] Inferring run settings from compute environment: {'program_relpath': None, 'program': '-m align_anything.trainers.tiv_to_t.dpo'}
9
+ 2024-09-21 10:30:42,389 INFO MainThread:2677650 [wandb_setup.py:_flush():76] Applying login settings: {}
10
+ 2024-09-21 10:30:42,389 INFO MainThread:2677650 [wandb_init.py:_log_setup():529] Logging user logs to ../outputs/dpo_tiv2t_1.5k_base/wandb/run-20240921_103042-1p62y7m7/logs/debug.log
11
+ 2024-09-21 10:30:42,389 INFO MainThread:2677650 [wandb_init.py:_log_setup():530] Logging internal logs to ../outputs/dpo_tiv2t_1.5k_base/wandb/run-20240921_103042-1p62y7m7/logs/debug-internal.log
12
+ 2024-09-21 10:30:42,389 INFO MainThread:2677650 [wandb_init.py:init():569] calling init triggers
13
+ 2024-09-21 10:30:42,389 INFO MainThread:2677650 [wandb_init.py:init():576] wandb.init called with sweep_config: {}
14
+ config: {'train_cfgs': {'ds_cfgs': 'ds_z3_config.json', 'epochs': 3, 'seed': 42, 'per_device_train_batch_size': 1.0, 'per_device_eval_batch_size': 1.0, 'gradient_accumulation_steps': 1.0, 'gradient_checkpointing': True, 'learning_rate': 1e-06, 'lr_scheduler_type': 'cosine', 'lr_warmup_ratio': 0.01, 'weight_decay': 0.0, 'adam_betas': [0.9, 0.95], 'bf16': True, 'fp16': False, 'eval_strategy': 'epoch', 'eval_interval': 10, 'regularization': 0.001, 'scale_coeff': 0.1, 'freeze_mm_proj': False, 'freeze_vision_tower': True, 'freeze_language_model': False}, 'data_cfgs': {'train_datasets': '/aifs4su/yaodong/datasets/aaa_dataset/TV2T-preference/extracted', 'train_template': 'NExTQA_preference', 'train_size': None, 'train_split': 'train', 'train_subset': None, 'train_data_files': 'extracted_preference_1.5k_washed.json', 'train_optional_args': [], 'eval_datasets': None, 'eval_template': None, 'eval_size': None, 'eval_split': None, 'eval_subset': None, 'eval_data_files': None, 'eval_optional_args': []}, 'logger_cfgs': {'log_type': 'wandb', 'log_project': 'align-anything', 'log_run_name': 'dpo', 'output_dir': '../outputs/dpo_tiv2t_1.5k_base', 'cache_dir': None, 'save_interval': 100000}, 'model_cfgs': {'model_name_or_path': '/aifs4su/yaodong/models/Qwen2-VL-7B-Instruct', 'trust_remote_code': True, 'model_max_length': 4096}, 'special_tokens': None}
15
+ 2024-09-21 10:30:42,389 INFO MainThread:2677650 [wandb_init.py:init():619] starting backend
16
+ 2024-09-21 10:30:42,389 INFO MainThread:2677650 [wandb_init.py:init():623] setting up manager
17
+ 2024-09-21 10:30:42,390 INFO MainThread:2677650 [backend.py:_multiprocessing_setup():105] multiprocessing start_methods=fork,spawn,forkserver, using: spawn
18
+ 2024-09-21 10:30:42,393 INFO MainThread:2677650 [wandb_init.py:init():631] backend started and connected
19
+ 2024-09-21 10:30:42,395 INFO MainThread:2677650 [wandb_init.py:init():720] updated telemetry
20
+ 2024-09-21 10:30:42,415 INFO MainThread:2677650 [wandb_init.py:init():753] communicating run to backend with 90.0 second timeout
21
+ 2024-09-21 10:30:42,928 INFO MainThread:2677650 [wandb_run.py:_on_init():2435] communicating current version
22
+ 2024-09-21 10:30:43,096 INFO MainThread:2677650 [wandb_run.py:_on_init():2444] got version response upgrade_message: "wandb version 0.18.1 is available! To upgrade, please run:\n $ pip install wandb --upgrade"
23
+
24
+ 2024-09-21 10:30:43,097 INFO MainThread:2677650 [wandb_init.py:init():804] starting run threads in backend
25
+ 2024-09-21 10:30:48,117 INFO MainThread:2677650 [wandb_run.py:_console_start():2413] atexit reg
26
+ 2024-09-21 10:30:48,117 INFO MainThread:2677650 [wandb_run.py:_redirect():2255] redirect: wrap_raw
27
+ 2024-09-21 10:30:48,117 INFO MainThread:2677650 [wandb_run.py:_redirect():2320] Wrapping output streams.
28
+ 2024-09-21 10:30:48,117 INFO MainThread:2677650 [wandb_run.py:_redirect():2345] Redirects installed.
29
+ 2024-09-21 10:30:48,121 INFO MainThread:2677650 [wandb_init.py:init():847] run started, returning control to user process
wandb/run-20240921_103042-1p62y7m7/run-1p62y7m7.wandb ADDED
Binary file (557 kB). View file
 
wandb/run-20240921_111222-4ony16ec/files/conda-environment.yaml ADDED
@@ -0,0 +1,516 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ name: hantao_tiv
2
+ channels:
3
+ - nvidia/label/cuda-12.1.0
4
+ - nvidia
5
+ - pytorch
6
+ - huggingface
7
+ - conda-forge
8
+ - defaults
9
+ dependencies:
10
+ - _libgcc_mutex=0.1=conda_forge
11
+ - _openmp_mutex=4.5=2_gnu
12
+ - aom=3.9.1=hac33072_0
13
+ - asttokens=2.4.1=pyhd8ed1ab_0
14
+ - blas=1.0=mkl
15
+ - brotli-python=1.1.0=py311hb755f60_1
16
+ - bzip2=1.0.8=h4bc722e_7
17
+ - ca-certificates=2024.7.4=hbcca054_0
18
+ - cairo=1.18.0=hebfffa5_3
19
+ - certifi=2024.7.4=pyhd8ed1ab_0
20
+ - cffi=1.16.0=py311hb3a22ac_0
21
+ - charset-normalizer=3.3.2=pyhd8ed1ab_0
22
+ - comm=0.2.2=pyhd8ed1ab_0
23
+ - cuda=12.1.0=0
24
+ - cuda-cccl=12.1.55=0
25
+ - cuda-command-line-tools=12.1.0=0
26
+ - cuda-compiler=12.1.0=0
27
+ - cuda-cudart=12.1.55=0
28
+ - cuda-cudart-dev=12.1.55=0
29
+ - cuda-cudart-static=12.1.55=0
30
+ - cuda-cuobjdump=12.1.55=0
31
+ - cuda-cupti=12.1.62=0
32
+ - cuda-cupti-static=12.1.62=0
33
+ - cuda-cuxxfilt=12.1.55=0
34
+ - cuda-demo-suite=12.1.55=0
35
+ - cuda-documentation=12.1.55=0
36
+ - cuda-driver-dev=12.1.55=0
37
+ - cuda-gdb=12.1.55=0
38
+ - cuda-libraries=12.1.0=0
39
+ - cuda-libraries-dev=12.1.0=0
40
+ - cuda-libraries-static=12.1.0=0
41
+ - cuda-nsight=12.1.55=0
42
+ - cuda-nsight-compute=12.1.0=0
43
+ - cuda-nvcc=12.1.66=0
44
+ - cuda-nvdisasm=12.1.55=0
45
+ - cuda-nvml-dev=12.1.55=0
46
+ - cuda-nvprof=12.1.55=0
47
+ - cuda-nvprune=12.1.55=0
48
+ - cuda-nvrtc=12.1.55=0
49
+ - cuda-nvrtc-dev=12.1.55=0
50
+ - cuda-nvrtc-static=12.1.55=0
51
+ - cuda-nvtx=12.1.66=0
52
+ - cuda-nvvp=12.1.55=0
53
+ - cuda-opencl=12.1.56=0
54
+ - cuda-opencl-dev=12.1.56=0
55
+ - cuda-profiler-api=12.1.55=0
56
+ - cuda-runtime=12.1.0=0
57
+ - cuda-sanitizer-api=12.1.55=0
58
+ - cuda-toolkit=12.1.0=0
59
+ - cuda-tools=12.1.0=0
60
+ - cuda-visual-tools=12.1.0=0
61
+ - dav1d=1.2.1=hd590300_0
62
+ - debugpy=1.8.2=py311h4332511_0
63
+ - exceptiongroup=1.2.2=pyhd8ed1ab_0
64
+ - executing=2.0.1=pyhd8ed1ab_0
65
+ - expat=2.6.2=h59595ed_0
66
+ - ffmpeg=7.0.1=gpl_h9be9148_104
67
+ - filelock=3.15.4=pyhd8ed1ab_0
68
+ - font-ttf-dejavu-sans-mono=2.37=hab24e00_0
69
+ - font-ttf-inconsolata=3.000=h77eed37_0
70
+ - font-ttf-source-code-pro=2.038=h77eed37_0
71
+ - font-ttf-ubuntu=0.83=h77eed37_2
72
+ - fontconfig=2.14.2=h14ed4e7_0
73
+ - fonts-conda-ecosystem=1=0
74
+ - fonts-conda-forge=1=0
75
+ - freetype=2.12.1=h267a509_2
76
+ - fribidi=1.0.10=h36c2ea0_0
77
+ - gds-tools=1.6.0.25=0
78
+ - gettext=0.22.5=h59595ed_2
79
+ - gettext-tools=0.22.5=h59595ed_2
80
+ - git-lfs=3.5.1=ha770c72_0
81
+ - gmp=6.3.0=hac33072_2
82
+ - gmpy2=2.1.5=py311hc4f1f91_1
83
+ - gnutls=3.7.9=hb077bed_0
84
+ - graphite2=1.3.13=h59595ed_1003
85
+ - h2=4.1.0=pyhd8ed1ab_0
86
+ - harfbuzz=9.0.0=hda332d3_1
87
+ - hpack=4.0.0=pyh9f0ad1d_0
88
+ - hyperframe=6.0.1=pyhd8ed1ab_0
89
+ - icu=75.1=he02047a_0
90
+ - idna=3.7=pyhd8ed1ab_0
91
+ - importlib-metadata=8.2.0=pyha770c72_0
92
+ - importlib_metadata=8.2.0=hd8ed1ab_0
93
+ - intel-openmp=2022.0.1=h06a4308_3633
94
+ - ipykernel=6.29.5=pyh3099207_0
95
+ - ipython=8.26.0=pyh707e725_0
96
+ - jedi=0.19.1=pyhd8ed1ab_0
97
+ - jinja2=3.1.4=pyhd8ed1ab_0
98
+ - jupyter_client=8.6.2=pyhd8ed1ab_0
99
+ - jupyter_core=5.7.2=py311h38be061_0
100
+ - keyutils=1.6.1=h166bdaf_0
101
+ - krb5=1.21.3=h659f571_0
102
+ - lame=3.100=h166bdaf_1003
103
+ - lcms2=2.16=hb7c19ff_0
104
+ - ld_impl_linux-64=2.40=hf3520f5_7
105
+ - lerc=4.0.0=h27087fc_0
106
+ - libabseil=20240116.2=cxx17_he02047a_1
107
+ - libasprintf=0.22.5=h661eb56_2
108
+ - libasprintf-devel=0.22.5=h661eb56_2
109
+ - libass=0.17.1=h39113c1_2
110
+ - libblas=3.9.0=16_linux64_mkl
111
+ - libcblas=3.9.0=16_linux64_mkl
112
+ - libcublas=12.1.0.26=0
113
+ - libcublas-dev=12.1.0.26=0
114
+ - libcublas-static=12.1.0.26=0
115
+ - libcufft=11.0.2.4=0
116
+ - libcufft-dev=11.0.2.4=0
117
+ - libcufft-static=11.0.2.4=0
118
+ - libcufile=1.6.0.25=0
119
+ - libcufile-dev=1.6.0.25=0
120
+ - libcufile-static=1.6.0.25=0
121
+ - libcurand=10.3.2.56=0
122
+ - libcurand-dev=10.3.2.56=0
123
+ - libcurand-static=10.3.2.56=0
124
+ - libcusolver=11.4.4.55=0
125
+ - libcusolver-dev=11.4.4.55=0
126
+ - libcusolver-static=11.4.4.55=0
127
+ - libcusparse=12.0.2.55=0
128
+ - libcusparse-dev=12.0.2.55=0
129
+ - libcusparse-static=12.0.2.55=0
130
+ - libdeflate=1.20=hd590300_0
131
+ - libdrm=2.4.122=h4ab18f5_0
132
+ - libedit=3.1.20191231=he28a2e2_2
133
+ - libexpat=2.6.2=h59595ed_0
134
+ - libffi=3.4.2=h7f98852_5
135
+ - libgcc-ng=14.1.0=h77fa898_0
136
+ - libgettextpo=0.22.5=h59595ed_2
137
+ - libgettextpo-devel=0.22.5=h59595ed_2
138
+ - libglib=2.80.3=h8a4344b_1
139
+ - libgomp=14.1.0=h77fa898_0
140
+ - libhwloc=2.11.1=default_hecaa2ac_1000
141
+ - libiconv=1.17=hd590300_2
142
+ - libidn2=2.3.7=hd590300_0
143
+ - libjpeg-turbo=3.0.0=hd590300_1
144
+ - liblapack=3.9.0=16_linux64_mkl
145
+ - libnpp=12.0.2.50=0
146
+ - libnpp-dev=12.0.2.50=0
147
+ - libnpp-static=12.0.2.50=0
148
+ - libnsl=2.0.1=hd590300_0
149
+ - libnvjitlink=12.1.105=0
150
+ - libnvjitlink-dev=12.1.55=0
151
+ - libnvjpeg=12.1.0.39=0
152
+ - libnvjpeg-dev=12.1.0.39=0
153
+ - libnvjpeg-static=12.1.0.39=0
154
+ - libnvvm-samples=12.1.55=0
155
+ - libopenvino=2024.2.0=h2da1b83_1
156
+ - libopenvino-auto-batch-plugin=2024.2.0=hb045406_1
157
+ - libopenvino-auto-plugin=2024.2.0=hb045406_1
158
+ - libopenvino-hetero-plugin=2024.2.0=h5c03a75_1
159
+ - libopenvino-intel-cpu-plugin=2024.2.0=h2da1b83_1
160
+ - libopenvino-intel-gpu-plugin=2024.2.0=h2da1b83_1
161
+ - libopenvino-intel-npu-plugin=2024.2.0=he02047a_1
162
+ - libopenvino-ir-frontend=2024.2.0=h5c03a75_1
163
+ - libopenvino-onnx-frontend=2024.2.0=h07e8aee_1
164
+ - libopenvino-paddle-frontend=2024.2.0=h07e8aee_1
165
+ - libopenvino-pytorch-frontend=2024.2.0=he02047a_1
166
+ - libopenvino-tensorflow-frontend=2024.2.0=h39126c6_1
167
+ - libopenvino-tensorflow-lite-frontend=2024.2.0=he02047a_1
168
+ - libopus=1.3.1=h7f98852_1
169
+ - libpciaccess=0.18=hd590300_0
170
+ - libpng=1.6.43=h2797004_0
171
+ - libprotobuf=4.25.3=h08a7969_0
172
+ - libsodium=1.0.18=h36c2ea0_1
173
+ - libsqlite=3.46.0=hde9e2c9_0
174
+ - libstdcxx-ng=14.1.0=hc0a3c3a_0
175
+ - libtasn1=4.19.0=h166bdaf_0
176
+ - libtiff=4.6.0=h1dd3fc0_3
177
+ - libunistring=0.9.10=h7f98852_0
178
+ - libuuid=2.38.1=h0b41bf4_0
179
+ - libva=2.22.0=hb711507_0
180
+ - libvpx=1.14.1=hac33072_0
181
+ - libwebp-base=1.4.0=hd590300_0
182
+ - libxcb=1.16=hd590300_0
183
+ - libxcrypt=4.4.36=hd590300_1
184
+ - libxml2=2.12.7=he7c6b58_4
185
+ - libzlib=1.3.1=h4ab18f5_1
186
+ - llvm-openmp=15.0.7=h0cdce71_0
187
+ - markupsafe=2.1.5=py311h459d7ec_0
188
+ - matplotlib-inline=0.1.7=pyhd8ed1ab_0
189
+ - mkl=2022.1.0=hc2b9512_224
190
+ - mpc=1.3.1=hfe3b2da_0
191
+ - mpfr=4.2.1=h38ae2d0_2
192
+ - mpmath=1.3.0=pyhd8ed1ab_0
193
+ - ncurses=6.5=h59595ed_0
194
+ - nest-asyncio=1.6.0=pyhd8ed1ab_0
195
+ - nettle=3.9.1=h7ab15ed_0
196
+ - networkx=3.3=pyhd8ed1ab_1
197
+ - nsight-compute=2023.1.0.15=0
198
+ - ocl-icd=2.3.2=hd590300_1
199
+ - openh264=2.4.1=h59595ed_0
200
+ - openjpeg=2.5.2=h488ebb8_0
201
+ - openssl=3.3.1=h4bc722e_2
202
+ - p11-kit=0.24.1=hc5aa10d_0
203
+ - packaging=24.1=pyhd8ed1ab_0
204
+ - parso=0.8.4=pyhd8ed1ab_0
205
+ - pcre2=10.44=h0f59acf_0
206
+ - pexpect=4.9.0=pyhd8ed1ab_0
207
+ - pickleshare=0.7.5=py_1003
208
+ - pillow=10.4.0=py311h82a398c_0
209
+ - pip=24.0=pyhd8ed1ab_0
210
+ - pixman=0.43.2=h59595ed_0
211
+ - prompt-toolkit=3.0.47=pyha770c72_0
212
+ - psutil=6.0.0=py311h331c9d8_0
213
+ - pthread-stubs=0.4=h36c2ea0_1001
214
+ - ptyprocess=0.7.0=pyhd3deb0d_0
215
+ - pugixml=1.14=h59595ed_0
216
+ - pure_eval=0.2.3=pyhd8ed1ab_0
217
+ - pycparser=2.22=pyhd8ed1ab_0
218
+ - pygments=2.18.0=pyhd8ed1ab_0
219
+ - pysocks=1.7.1=pyha2e5f31_6
220
+ - python=3.11.9=hb806964_0_cpython
221
+ - python_abi=3.11=4_cp311
222
+ - pytorch=2.4.0=py3.11_cuda12.1_cudnn9.1.0_0
223
+ - pytorch-cuda=12.1=ha16c6d3_5
224
+ - pytorch-mutex=1.0=cuda
225
+ - pyyaml=6.0.1=py311h459d7ec_1
226
+ - pyzmq=26.0.3=py311h08a0b41_0
227
+ - readline=8.2=h8228510_1
228
+ - requests=2.32.3=pyhd8ed1ab_0
229
+ - setuptools=71.0.4=pyhd8ed1ab_0
230
+ - six=1.16.0=pyh6c4a22f_0
231
+ - snappy=1.2.1=ha2e4443_0
232
+ - stack_data=0.6.2=pyhd8ed1ab_0
233
+ - svt-av1=2.1.2=hac33072_0
234
+ - sympy=1.13.0=pypyh2585a3b_103
235
+ - tbb=2021.12.0=h434a139_3
236
+ - tk=8.6.13=noxft_h4845f30_101
237
+ - torchaudio=2.4.0=py311_cu121
238
+ - torchtriton=3.0.0=py311
239
+ - tornado=6.4.1=py311h331c9d8_0
240
+ - traitlets=5.14.3=pyhd8ed1ab_0
241
+ - typing_extensions=4.12.2=pyha770c72_0
242
+ - urllib3=2.2.2=pyhd8ed1ab_1
243
+ - wayland=1.23.0=h5291e77_0
244
+ - wayland-protocols=1.36=hd8ed1ab_0
245
+ - wcwidth=0.2.13=pyhd8ed1ab_0
246
+ - wheel=0.43.0=pyhd8ed1ab_1
247
+ - x264=1!164.3095=h166bdaf_2
248
+ - x265=3.5=h924138e_3
249
+ - xorg-fixesproto=5.0=h7f98852_1002
250
+ - xorg-kbproto=1.0.7=h7f98852_1002
251
+ - xorg-libice=1.1.1=hd590300_0
252
+ - xorg-libsm=1.2.4=h7391055_0
253
+ - xorg-libx11=1.8.9=hb711507_1
254
+ - xorg-libxau=1.0.11=hd590300_0
255
+ - xorg-libxdmcp=1.1.3=h7f98852_0
256
+ - xorg-libxext=1.3.4=h0b41bf4_2
257
+ - xorg-libxfixes=5.0.3=h7f98852_1004
258
+ - xorg-libxrender=0.9.11=hd590300_0
259
+ - xorg-renderproto=0.11.1=h7f98852_1002
260
+ - xorg-xextproto=7.3.0=h0b41bf4_1003
261
+ - xorg-xproto=7.0.31=h7f98852_1007
262
+ - xz=5.2.6=h166bdaf_0
263
+ - yaml=0.2.5=h7f98852_2
264
+ - zeromq=4.3.5=h75354e8_4
265
+ - zipp=3.19.2=pyhd8ed1ab_0
266
+ - zlib=1.3.1=h4ab18f5_1
267
+ - zstandard=0.23.0=py311h5cd10c7_0
268
+ - zstd=1.5.6=ha6fb4c9_0
269
+ - pip:
270
+ - about-time==4.2.1
271
+ - absl-py==2.1.0
272
+ - accelerate==0.34.0
273
+ - aiofiles==23.2.1
274
+ - aiohttp==3.9.5
275
+ - aiohttp-retry==2.8.3
276
+ - aiosignal==1.3.1
277
+ - align-anything==0.0.1.dev0
278
+ - alive-progress==3.1.5
279
+ - amqp==5.2.0
280
+ - annotated-types==0.7.0
281
+ - antlr4-python3-runtime==4.9.3
282
+ - anyio==4.4.0
283
+ - appdirs==1.4.4
284
+ - asyncssh==2.16.0
285
+ - atpublic==5.0
286
+ - attrs==23.2.0
287
+ - audioread==3.0.1
288
+ - backoff==2.2.1
289
+ - billiard==4.2.0
290
+ - boto3==1.35.9
291
+ - botocore==1.35.9
292
+ - cachetools==5.4.0
293
+ - celery==5.4.0
294
+ - cfgv==3.4.0
295
+ - click==8.1.7
296
+ - click-didyoumean==0.3.1
297
+ - click-plugins==1.1.1
298
+ - click-repl==0.3.0
299
+ - cloudpickle==3.0.0
300
+ - cmake==3.30.1
301
+ - colorama==0.4.6
302
+ - commonmark==0.9.1
303
+ - configobj==5.0.8
304
+ - contourpy==1.2.1
305
+ - cryptography==43.0.0
306
+ - cycler==0.12.1
307
+ - dacite==1.6.0
308
+ - dagshub==0.3.35
309
+ - dagshub-annotation-converter==0.1.0
310
+ - dataclasses-json==0.6.7
311
+ - datasets==2.20.0
312
+ - decorator==4.4.2
313
+ - deepspeed==0.14.4
314
+ - dictdiffer==0.9.0
315
+ - diffusers==0.29.2
316
+ - dill==0.3.8
317
+ - diskcache==5.6.3
318
+ - distlib==0.3.8
319
+ - distro==1.9.0
320
+ - dnspython==2.6.1
321
+ - docker-pycreds==0.4.0
322
+ - docstring-parser==0.16
323
+ - dpath==2.2.0
324
+ - dulwich==0.22.1
325
+ - dvc==3.55.1
326
+ - dvc-data==3.16.5
327
+ - dvc-http==2.32.0
328
+ - dvc-objects==5.1.0
329
+ - dvc-render==1.0.2
330
+ - dvc-studio-client==0.21.0
331
+ - dvc-task==0.4.0
332
+ - einops==0.8.0
333
+ - email-validator==2.2.0
334
+ - entrypoints==0.4
335
+ - fastapi==0.111.1
336
+ - fastapi-cli==0.0.4
337
+ - ffmpy==0.3.3
338
+ - fire==0.6.0
339
+ - flatten-dict==0.4.2
340
+ - flufl-lock==8.1.0
341
+ - fonttools==4.53.1
342
+ - frozenlist==1.4.1
343
+ - fsspec==2024.5.0
344
+ - funcy==2.0
345
+ - fusepy==3.0.1
346
+ - gitdb==4.0.11
347
+ - gitpython==3.1.43
348
+ - gql==3.5.0
349
+ - gradio==4.39.0
350
+ - gradio-client==1.1.1
351
+ - gradio-multimodalchatbot==0.0.1
352
+ - grandalf==0.8
353
+ - grapheme==0.6.0
354
+ - graphql-core==3.2.3
355
+ - grpcio==1.65.1
356
+ - gto==1.7.1
357
+ - h11==0.14.0
358
+ - hjson==3.1.0
359
+ - httpcore==1.0.5
360
+ - httptools==0.6.1
361
+ - httpx==0.27.2
362
+ - huggingface-hub==0.24.3
363
+ - hydra-core==1.3.2
364
+ - identify==2.6.0
365
+ - imageio==2.35.1
366
+ - imageio-ffmpeg==0.5.1
367
+ - importlib-resources==6.4.0
368
+ - iniconfig==2.0.0
369
+ - interegular==0.3.3
370
+ - iterative-telemetry==0.0.8
371
+ - jmespath==1.0.1
372
+ - joblib==1.4.2
373
+ - jsonschema==4.23.0
374
+ - jsonschema-specifications==2023.12.1
375
+ - kiwisolver==1.4.5
376
+ - kombu==5.4.0
377
+ - lark==1.1.9
378
+ - lazy-loader==0.4
379
+ - librosa==0.10.2.post1
380
+ - llamafactory==0.8.4.dev0
381
+ - llvmlite==0.43.0
382
+ - lm-format-enforcer==0.10.3
383
+ - lxml==5.3.0
384
+ - markdown==3.6
385
+ - markdown-it-py==3.0.0
386
+ - marshmallow==3.22.0
387
+ - matplotlib==3.9.1
388
+ - mdurl==0.1.2
389
+ - mmsg==0.1.dev14+gbd2b056.d20240803
390
+ - moviepy==1.0.3
391
+ - mpi4py==4.0.0
392
+ - msgpack==1.0.8
393
+ - multidict==6.0.5
394
+ - multiprocess==0.70.16
395
+ - mypy-extensions==1.0.0
396
+ - ninja==1.11.1.1
397
+ - nodeenv==1.9.1
398
+ - numba==0.60.0
399
+ - numpy==1.26.4
400
+ - nvidia-cublas-cu12==12.1.3.1
401
+ - nvidia-cuda-cupti-cu12==12.1.105
402
+ - nvidia-cuda-nvrtc-cu12==12.1.105
403
+ - nvidia-cuda-runtime-cu12==12.1.105
404
+ - nvidia-cudnn-cu12==8.9.2.26
405
+ - nvidia-cufft-cu12==11.0.2.54
406
+ - nvidia-curand-cu12==10.3.2.106
407
+ - nvidia-cusolver-cu12==11.4.5.107
408
+ - nvidia-cusparse-cu12==12.1.0.106
409
+ - nvidia-ml-py==12.535.161
410
+ - nvidia-nccl-cu12==2.20.5
411
+ - nvidia-nvjitlink-cu12==12.5.82
412
+ - nvidia-nvtx-cu12==12.1.105
413
+ - nvitop==1.3.2
414
+ - omegaconf==2.3.0
415
+ - openai==1.37.1
416
+ - optree==0.12.1
417
+ - orjson==3.10.6
418
+ - outlines==0.0.47.dev37+g26e2934
419
+ - pandas==2.2.2
420
+ - pathspec==0.12.1
421
+ - pathvalidate==3.0.0
422
+ - peft==0.12.0
423
+ - platformdirs==3.11.0
424
+ - pluggy==1.5.0
425
+ - pooch==1.8.2
426
+ - pre-commit==3.8.0
427
+ - proglog==0.1.10
428
+ - prometheus-client==0.20.0
429
+ - prometheus-fastapi-instrumentator==7.0.0
430
+ - protobuf==4.25.4
431
+ - py-cpuinfo==9.0.0
432
+ - pyairports==2.1.1
433
+ - pyarrow==17.0.0
434
+ - pyarrow-hotfix==0.6
435
+ - pyav==13.0.0
436
+ - pycountry==24.6.1
437
+ - pydantic==2.8.2
438
+ - pydantic-core==2.20.1
439
+ - pydot==3.0.1
440
+ - pydub==0.25.1
441
+ - pygit2==1.15.1
442
+ - pygtrie==2.5.0
443
+ - pyparsing==3.1.2
444
+ - pytest==8.3.2
445
+ - python-dateutil==2.9.0.post0
446
+ - python-dotenv==1.0.1
447
+ - python-multipart==0.0.9
448
+ - pytz==2024.1
449
+ - ranger-fm==1.9.3
450
+ - ray==2.34.0
451
+ - referencing==0.35.1
452
+ - regex==2024.7.24
453
+ - requests-toolbelt==1.0.0
454
+ - rfc3986==1.5.0
455
+ - rich==13.1.0
456
+ - rpds-py==0.19.1
457
+ - ruamel-yaml==0.18.6
458
+ - ruamel-yaml-clib==0.2.8
459
+ - ruff==0.5.5
460
+ - s3transfer==0.10.2
461
+ - safetensors==0.4.3
462
+ - scikit-learn==1.5.1
463
+ - scipy==1.14.0
464
+ - scmrepo==3.3.7
465
+ - semantic-version==2.10.0
466
+ - semver==3.0.2
467
+ - sentencepiece==0.2.0
468
+ - sentry-sdk==2.11.0
469
+ - setproctitle==1.3.3
470
+ - shellingham==1.5.4
471
+ - shortuuid==1.0.13
472
+ - shtab==1.7.1
473
+ - smmap==5.0.1
474
+ - sniffio==1.3.1
475
+ - soundfile==0.12.1
476
+ - soxr==0.4.0
477
+ - sqltrie==0.11.1
478
+ - sse-starlette==2.1.3
479
+ - starlette==0.37.2
480
+ - tabulate==0.9.0
481
+ - tenacity==8.2.3
482
+ - tensorboard==2.17.0
483
+ - tensorboard-data-server==0.7.2
484
+ - term-image==0.7.2
485
+ - termcolor==2.4.0
486
+ - threadpoolctl==3.5.0
487
+ - tiktoken==0.7.0
488
+ - tokenizers==0.19.1
489
+ - tomlkit==0.12.0
490
+ - torch==2.3.1
491
+ - torchvision==0.18.1
492
+ - tqdm==4.66.4
493
+ - transformers==4.45.0.dev0
494
+ - treelib==1.6.4
495
+ - triton==2.3.1
496
+ - trl==0.9.6
497
+ - typer==0.12.3
498
+ - typing-inspect==0.9.0
499
+ - tyro==0.8.10
500
+ - tzdata==2024.1
501
+ - uvicorn==0.30.3
502
+ - uvloop==0.19.0
503
+ - vine==5.1.0
504
+ - virtualenv==20.26.3
505
+ - vllm==0.5.3.post1
506
+ - vllm-flash-attn==2.5.9.post1
507
+ - voluptuous==0.15.2
508
+ - wandb==0.17.5
509
+ - watchfiles==0.22.0
510
+ - websockets==11.0.3
511
+ - werkzeug==3.0.3
512
+ - xformers==0.0.27
513
+ - xxhash==3.4.1
514
+ - yarl==1.9.4
515
+ - zc-lockfile==3.0.post1
516
+ prefix: /aifs4su/yaodong/miniconda3/envs/hantao_tiv
wandb/run-20240921_111222-4ony16ec/files/config.yaml ADDED
@@ -0,0 +1,112 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ wandb_version: 1
2
+
3
+ train_cfgs:
4
+ desc: null
5
+ value:
6
+ ds_cfgs: ds_z3_config.json
7
+ epochs: 3
8
+ seed: 42
9
+ per_device_train_batch_size: 1.0
10
+ per_device_eval_batch_size: 1.0
11
+ gradient_accumulation_steps: 1.0
12
+ gradient_checkpointing: true
13
+ learning_rate: 1.0e-06
14
+ lr_scheduler_type: cosine
15
+ lr_warmup_ratio: 0.01
16
+ weight_decay: 0.0
17
+ adam_betas:
18
+ - 0.9
19
+ - 0.95
20
+ bf16: true
21
+ fp16: false
22
+ eval_strategy: epoch
23
+ eval_interval: 10
24
+ regularization: 0.001
25
+ scale_coeff: 0.1
26
+ freeze_mm_proj: false
27
+ freeze_vision_tower: true
28
+ freeze_language_model: false
29
+ data_cfgs:
30
+ desc: null
31
+ value:
32
+ train_datasets: /aifs4su/yaodong/datasets/aaa_dataset/TV2T-preference/extracted
33
+ train_template: NExTQA_preference
34
+ train_size: null
35
+ train_split: train
36
+ train_subset: null
37
+ train_data_files: 1.5k_clean_duplicate.json
38
+ train_optional_args: []
39
+ eval_datasets: null
40
+ eval_template: null
41
+ eval_size: null
42
+ eval_split: null
43
+ eval_subset: null
44
+ eval_data_files: null
45
+ eval_optional_args: []
46
+ logger_cfgs:
47
+ desc: null
48
+ value:
49
+ log_type: wandb
50
+ log_project: align-anything
51
+ log_run_name: dpo
52
+ output_dir: ../outputs/dpo_tiv2t_1.5k_base
53
+ cache_dir: null
54
+ save_interval: 100000
55
+ model_cfgs:
56
+ desc: null
57
+ value:
58
+ model_name_or_path: /aifs4su/yaodong/models/Qwen2-VL-7B-Instruct
59
+ trust_remote_code: true
60
+ model_max_length: 4096
61
+ special_tokens:
62
+ desc: null
63
+ value: null
64
+ _wandb:
65
+ desc: null
66
+ value:
67
+ python_version: 3.11.9
68
+ cli_version: 0.17.5
69
+ framework: huggingface
70
+ huggingface_version: 4.45.0.dev0
71
+ is_jupyter_run: false
72
+ is_kaggle_kernel: false
73
+ start_time: 1726888342
74
+ t:
75
+ 1:
76
+ - 1
77
+ - 5
78
+ - 11
79
+ - 41
80
+ - 49
81
+ - 51
82
+ - 53
83
+ - 55
84
+ - 71
85
+ - 83
86
+ - 98
87
+ - 105
88
+ 2:
89
+ - 1
90
+ - 5
91
+ - 11
92
+ - 41
93
+ - 49
94
+ - 51
95
+ - 53
96
+ - 55
97
+ - 71
98
+ - 83
99
+ - 98
100
+ - 105
101
+ 3:
102
+ - 2
103
+ - 13
104
+ - 16
105
+ - 23
106
+ - 61
107
+ 4: 3.11.9
108
+ 5: 0.17.5
109
+ 6: 4.45.0.dev0
110
+ 8:
111
+ - 5
112
+ 13: linux-x86_64
wandb/run-20240921_111222-4ony16ec/files/output.log ADDED
@@ -0,0 +1,609 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ ***** Running training *****
3
+
4
+ Training 1/3 epoch: 0%| | 0/531 [00:00<?, ?it/s]`use_cache=True` is incompatible with gradient checkpointing. Setting `use_cache=False`...
5
+ /aifs4su/yaodong/miniconda3/envs/hantao_tiv/lib/python3.11/site-packages/torch/utils/checkpoint.py:295: FutureWarning: `torch.cpu.amp.autocast(args...)` is deprecated. Please use `torch.amp.autocast('cpu', args...)` instead.
6
+ with torch.enable_grad(), device_autocast_ctx, torch.cpu.amp.autocast(**ctx.cpu_autocast_kwargs): # type: ignore[attr-defined]
7
+
8
+
9
+
10
+
11
+
12
+
13
+
14
+
15
+ Training 1/3 epoch (loss 0.8395): 2%|██▍ | 9/531 [01:14<1:12:50, 8.37s/it]
16
+
17
+
18
+
19
+
20
+
21
+
22
+
23
+
24
+
25
+
26
+ Training 1/3 epoch (loss 1.9732): 4%|█████ | 19/531 [02:31<1:13:02, 8.56s/it]
27
+
28
+
29
+
30
+
31
+
32
+
33
+
34
+
35
+
36
+
37
+ Training 1/3 epoch (loss 3.0771): 5%|███████▋ | 29/531 [03:48<1:01:33, 7.36s/it]
38
+
39
+
40
+
41
+
42
+
43
+
44
+
45
+
46
+
47
+
48
+ Training 1/3 epoch (loss 1.0346): 7%|██████████▎ | 39/531 [05:15<1:07:13, 8.20s/it]
49
+
50
+
51
+
52
+
53
+
54
+
55
+
56
+
57
+
58
+
59
+
60
+ Training 1/3 epoch (loss 0.4914): 9%|█████████████ | 49/531 [06:41<1:20:46, 10.05s/it]
61
+
62
+
63
+
64
+
65
+
66
+
67
+
68
+
69
+
70
+
71
+ Training 1/3 epoch (loss 1.4690): 11%|███████████████▉ | 59/531 [07:59<57:43, 7.34s/it]
72
+
73
+
74
+
75
+
76
+
77
+
78
+
79
+
80
+
81
+
82
+ Training 1/3 epoch (loss 0.6775): 13%|██████████████████▌ | 69/531 [09:22<59:22, 7.71s/it]
83
+
84
+
85
+
86
+
87
+
88
+
89
+
90
+
91
+
92
+
93
+ Training 1/3 epoch (loss 0.4325): 15%|████████████████████▉ | 79/531 [10:48<1:12:39, 9.65s/it]
94
+
95
+
96
+
97
+
98
+
99
+
100
+
101
+
102
+
103
+
104
+ Training 1/3 epoch (loss 1.0096): 17%|███████████████████████▋ | 89/531 [12:20<1:16:49, 10.43s/it]
105
+
106
+
107
+
108
+
109
+
110
+
111
+
112
+
113
+
114
+
115
+ Training 1/3 epoch (loss 0.2861): 19%|██████████████████████████▋ | 99/531 [13:40<57:03, 7.93s/it]
116
+
117
+
118
+
119
+
120
+
121
+
122
+
123
+
124
+
125
+
126
+ Training 1/3 epoch (loss 1.1329): 21%|█████████████████████████████▏ | 109/531 [14:58<57:58, 8.24s/it]
127
+
128
+
129
+
130
+
131
+
132
+
133
+
134
+
135
+
136
+
137
+ Training 1/3 epoch (loss 1.0573): 22%|███████████████████████████████▊ | 119/531 [16:27<56:45, 8.27s/it]
138
+
139
+
140
+
141
+
142
+
143
+
144
+
145
+
146
+
147
+
148
+ Training 1/3 epoch (loss 1.2254): 24%|██████████████████████████████████▍ | 129/531 [17:46<56:23, 8.42s/it]
149
+
150
+
151
+
152
+
153
+
154
+
155
+
156
+
157
+
158
+
159
+ Training 1/3 epoch (loss 0.2646): 26%|█████████████████████████████████████▏ | 139/531 [19:16<56:30, 8.65s/it]
160
+
161
+
162
+
163
+
164
+
165
+
166
+
167
+
168
+
169
+
170
+ Training 1/3 epoch (loss 0.2230): 28%|███████████████████████████████████████▊ | 149/531 [20:38<48:28, 7.61s/it]
171
+
172
+
173
+
174
+
175
+
176
+
177
+
178
+
179
+
180
+
181
+ Training 1/3 epoch (loss 1.6615): 30%|██████████████████████████████████████████▌ | 159/531 [21:57<47:14, 7.62s/it]
182
+
183
+
184
+
185
+
186
+
187
+
188
+
189
+
190
+
191
+
192
+ Training 1/3 epoch (loss 0.3717): 32%|█████████████████████████████████████████████▏ | 169/531 [23:20<49:05, 8.14s/it]
193
+
194
+
195
+
196
+
197
+
198
+
199
+
200
+
201
+
202
+
203
+ Training 2/3 epoch (loss 0.4366): 34%|███████████████████████████████████████████████▊ | 179/531 [24:48<47:02, 8.02s/it]
204
+
205
+
206
+
207
+
208
+
209
+
210
+
211
+
212
+
213
+
214
+ Training 2/3 epoch (loss 1.9746): 36%|██████████████████████████████████████████████████▌ | 189/531 [26:05<40:13, 7.06s/it]
215
+
216
+
217
+
218
+
219
+
220
+
221
+
222
+
223
+
224
+
225
+ Training 2/3 epoch (loss 0.9471): 37%|█████████████████████████████████████████████████████▏ | 199/531 [27:24<43:32, 7.87s/it]
226
+
227
+
228
+
229
+
230
+
231
+
232
+
233
+
234
+
235
+
236
+ Training 2/3 epoch (loss 0.5072): 39%|███████████████████████████████████████████████████████▉ | 209/531 [28:43<43:05, 8.03s/it]
237
+
238
+
239
+
240
+
241
+
242
+
243
+
244
+
245
+
246
+
247
+ Training 2/3 epoch (loss 0.2369): 41%|██████████████████████████████████████████████████████████▌ | 219/531 [30:08<39:52, 7.67s/it]
248
+
249
+
250
+
251
+
252
+
253
+
254
+
255
+
256
+
257
+
258
+ Training 2/3 epoch (loss 0.9289): 43%|█████████████████████████████████████████████████████████████▏ | 229/531 [31:38<46:09, 9.17s/it]
259
+
260
+
261
+
262
+
263
+
264
+
265
+
266
+
267
+
268
+
269
+ Training 2/3 epoch (loss 0.7007): 45%|███████████████████████████████████████████████████████████████▉ | 239/531 [32:51<34:44, 7.14s/it]
270
+
271
+
272
+
273
+
274
+
275
+
276
+
277
+
278
+
279
+
280
+ Training 2/3 epoch (loss 0.5656): 47%|██████████████████████████████████████████████████████████████████▌ | 249/531 [34:16<37:29, 7.98s/it]
281
+
282
+
283
+
284
+
285
+
286
+
287
+
288
+
289
+
290
+
291
+ Training 2/3 epoch (loss 0.3311): 49%|█████████████████████████████████████████████████████████████████████▎ | 259/531 [35:44<39:41, 8.75s/it]
292
+
293
+
294
+
295
+
296
+
297
+
298
+
299
+
300
+
301
+
302
+ Training 2/3 epoch (loss 0.2943): 51%|███████████████████████████████████████████████████████████████████████▉ | 269/531 [37:09<36:41, 8.40s/it]
303
+
304
+
305
+
306
+
307
+
308
+
309
+
310
+
311
+
312
+
313
+ Training 2/3 epoch (loss 0.6977): 53%|██████████████████████████████████████████████████████████████████████████▌ | 279/531 [38:28<31:36, 7.52s/it]
314
+
315
+
316
+
317
+
318
+
319
+
320
+
321
+
322
+
323
+
324
+ Training 2/3 epoch (loss 1.3606): 54%|█████████████████████████████████████████████████████████████████████████████▎ | 289/531 [39:52<35:27, 8.79s/it]
325
+
326
+
327
+
328
+
329
+
330
+
331
+
332
+
333
+
334
+
335
+ Training 2/3 epoch (loss 0.3531): 56%|███████████████████████████████████████████████████████████████████████████████▉ | 299/531 [41:15<28:46, 7.44s/it]
336
+
337
+
338
+
339
+
340
+
341
+
342
+
343
+
344
+
345
+
346
+ Training 2/3 epoch (loss 1.3322): 58%|██████████████████████████████████████████████████████████████████████████████████▋ | 309/531 [42:44<34:51, 9.42s/it]
347
+
348
+
349
+
350
+
351
+
352
+
353
+
354
+
355
+
356
+
357
+ Training 2/3 epoch (loss 0.3598): 60%|█████████████████████████████████████████████████████████████████████████████████████▎ | 319/531 [44:11<32:19, 9.15s/it]
358
+
359
+
360
+
361
+
362
+
363
+
364
+
365
+
366
+
367
+
368
+ Training 2/3 epoch (loss 0.3140): 62%|███████████████████████████████████████████████████████████████████████████████████████▉ | 329/531 [45:28<26:26, 7.85s/it]
369
+
370
+
371
+
372
+
373
+
374
+
375
+
376
+
377
+
378
+
379
+ Training 2/3 epoch (loss 0.4596): 64%|██████████████████████████████████████████████████████████████████████████████████████████▋ | 339/531 [46:45<23:37, 7.38s/it]
380
+
381
+
382
+
383
+
384
+
385
+
386
+
387
+
388
+
389
+
390
+ Training 2/3 epoch (loss 0.1021): 66%|█████████████████████████████████████████████████████████████████████████████████████████████▎ | 349/531 [48:14<26:38, 8.78s/it]
391
+
392
+
393
+
394
+
395
+
396
+
397
+
398
+
399
+
400
+
401
+ Training 3/3 epoch (loss 0.2287): 68%|████████████████████████████████████████████████████████████████████████████████████████████████ | 359/531 [49:34<22:19, 7.79s/it]
402
+
403
+
404
+
405
+
406
+
407
+
408
+
409
+
410
+
411
+
412
+ Training 3/3 epoch (loss 0.5106): 69%|██████████████████████████████████████████████████████████████████████████████████████████████████▋ | 369/531 [50:50<19:41, 7.29s/it]
413
+
414
+
415
+
416
+
417
+
418
+
419
+
420
+
421
+
422
+
423
+
424
+ Training 3/3 epoch (loss 0.1319): 71%|█████████████████████████████████████████████████████████████████████████████████████████████████████▎ | 379/531 [52:11<21:03, 8.31s/it]
425
+
426
+
427
+
428
+
429
+
430
+
431
+
432
+
433
+
434
+
435
+
436
+ Training 3/3 epoch (loss 0.1420): 73%|████████████████████████████████████████████████████████████████████████████████████████████████████████ | 389/531 [53:38<22:51, 9.66s/it]
437
+
438
+
439
+
440
+
441
+
442
+
443
+
444
+
445
+
446
+
447
+
448
+ Training 3/3 epoch (loss 0.5357): 75%|██████████████████████████████████████████████████████████████████████████████████████████████████████████▋ | 399/531 [54:56<17:25, 7.92s/it]
449
+
450
+
451
+
452
+
453
+
454
+
455
+
456
+
457
+
458
+
459
+ Training 3/3 epoch (loss 0.1835): 77%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████▎ | 409/531 [56:25<16:15, 8.00s/it]
460
+
461
+
462
+
463
+
464
+
465
+
466
+
467
+
468
+
469
+
470
+ Training 3/3 epoch (loss 0.5765): 79%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████ | 419/531 [57:47<19:40, 10.54s/it]
471
+
472
+
473
+
474
+
475
+
476
+
477
+
478
+
479
+
480
+
481
+ Training 3/3 epoch (loss 1.8443): 81%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████▋ | 429/531 [59:02<12:57, 7.62s/it]
482
+
483
+
484
+
485
+
486
+
487
+
488
+
489
+
490
+
491
+
492
+
493
+ Training 3/3 epoch (loss 0.2949): 83%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████ | 440/531 [1:00:38<12:14, 8.07s/it]
494
+
495
+
496
+
497
+
498
+
499
+
500
+
501
+
502
+
503
+ Training 3/3 epoch (loss 1.1613): 85%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 449/531 [1:01:58<11:28, 8.40s/it]
504
+
505
+
506
+
507
+
508
+
509
+
510
+
511
+
512
+
513
+
514
+ Training 3/3 epoch (loss 0.2900): 86%|█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████ | 459/531 [1:03:16<09:07, 7.61s/it]
515
+
516
+
517
+
518
+
519
+
520
+
521
+
522
+
523
+
524
+
525
+ Training 3/3 epoch (loss 0.2732): 88%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▋ | 469/531 [1:04:46<09:23, 9.09s/it]
526
+
527
+
528
+
529
+
530
+
531
+
532
+
533
+
534
+
535
+
536
+ Training 3/3 epoch (loss 0.9524): 90%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▎ | 479/531 [1:06:03<06:42, 7.73s/it]
537
+
538
+
539
+
540
+
541
+
542
+
543
+
544
+
545
+
546
+
547
+ Training 3/3 epoch (loss 0.5670): 92%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▉ | 489/531 [1:07:33<06:22, 9.11s/it]
548
+
549
+
550
+
551
+
552
+
553
+
554
+
555
+
556
+
557
+
558
+ Training 3/3 epoch (loss 0.3265): 94%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▌ | 499/531 [1:08:57<04:22, 8.21s/it]
559
+
560
+
561
+
562
+
563
+
564
+
565
+
566
+
567
+
568
+
569
+
570
+ Training 3/3 epoch (loss 1.3381): 96%|██████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▍ | 510/531 [1:10:24<02:47, 7.96s/it]
571
+
572
+
573
+
574
+
575
+
576
+
577
+
578
+
579
+
580
+ Training 3/3 epoch (loss 0.2275): 98%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▊ | 519/531 [1:11:33<01:35, 7.93s/it]
581
+
582
+
583
+
584
+
585
+
586
+
587
+
588
+
589
+
590
+
591
+ Training 3/3 epoch (loss 0.7530): 100%|█████████���█████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▍| 529/531 [1:13:01<00:16, 8.38s/it]
592
+
593
+ Training 3/3 epoch (loss 0.1529): 100%|███████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████▋| 530/531 [1:13:11<00:08, 8.81s/it]
594
+ Saving model to "../outputs/dpo_tiv2t_1.5k_base" ...
595
+
596
+ Training 3/3 epoch (loss 0.4428): 100%|████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████████| 531/531 [1:13:19<00:00, 8.28s/it]
597
+ [2024-09-21 12:25:55,184] [INFO] [logging.py:96:log_dist] [Rank 0] [Torch] Checkpoint global_step531 is about to be saved!
598
+ [2024-09-21 12:25:55,184] [INFO] [engine.py:3591:save_16bit_model] Saving model weights to ../outputs/dpo_tiv2t_1.5k_base/pytorch_model.bin, tag: global_step531
599
+ [2024-09-21 12:25:55,184] [INFO] [torch_checkpoint_engine.py:21:save] [Torch] Saving ../outputs/dpo_tiv2t_1.5k_base/pytorch_model.bin...
600
+ [2024-09-21 12:26:08,310] [INFO] [torch_checkpoint_engine.py:23:save] [Torch] Saved ../outputs/dpo_tiv2t_1.5k_base/pytorch_model.bin.
601
+ [2024-09-21 12:26:08,311] [INFO] [torch_checkpoint_engine.py:33:commit] [Torch] Checkpoint global_step531 is ready now!
602
+ Model saved!
603
+ Saving 16-bit model...
604
+ [2024-09-21 12:26:15,942] [INFO] [logging.py:96:log_dist] [Rank 0] [Torch] Checkpoint global_step531 is about to be saved!
605
+ [2024-09-21 12:26:15,943] [INFO] [engine.py:3591:save_16bit_model] Saving model weights to ../outputs/dpo_tiv2t_1.5k_base/pytorch_model.bin, tag: global_step531
606
+ [2024-09-21 12:26:15,943] [INFO] [torch_checkpoint_engine.py:21:save] [Torch] Saving ../outputs/dpo_tiv2t_1.5k_base/pytorch_model.bin...
607
+ [2024-09-21 12:26:31,191] [INFO] [torch_checkpoint_engine.py:23:save] [Torch] Saved ../outputs/dpo_tiv2t_1.5k_base/pytorch_model.bin.
608
+ [2024-09-21 12:26:31,192] [INFO] [torch_checkpoint_engine.py:33:commit] [Torch] Checkpoint global_step531 is ready now!
609
+ Model saved!
wandb/run-20240921_111222-4ony16ec/files/requirements.txt ADDED
@@ -0,0 +1,325 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Brotli==1.1.0
2
+ GitPython==3.1.43
3
+ Jinja2==3.1.4
4
+ Markdown==3.6
5
+ MarkupSafe==2.1.5
6
+ PySocks==1.7.1
7
+ PyYAML==6.0.1
8
+ Pygments==2.18.0
9
+ Werkzeug==3.0.3
10
+ about-time==4.2.1
11
+ absl-py==2.1.0
12
+ accelerate==0.34.0
13
+ aiofiles==23.2.1
14
+ aiohttp-retry==2.8.3
15
+ aiohttp==3.9.5
16
+ aiosignal==1.3.1
17
+ align-anything==0.0.1.dev0
18
+ align-anything==0.0.1.dev0
19
+ alive-progress==3.1.5
20
+ amqp==5.2.0
21
+ annotated-types==0.7.0
22
+ antlr4-python3-runtime==4.9.3
23
+ anyio==4.4.0
24
+ appdirs==1.4.4
25
+ asttokens==2.4.1
26
+ asyncssh==2.16.0
27
+ atpublic==5.0
28
+ attrs==23.2.0
29
+ audioread==3.0.1
30
+ autocommand==2.2.2
31
+ backoff==2.2.1
32
+ backports.tarfile==1.2.0
33
+ billiard==4.2.0
34
+ boto3==1.35.9
35
+ botocore==1.35.9
36
+ cachetools==5.4.0
37
+ celery==5.4.0
38
+ certifi==2024.7.4
39
+ cffi==1.16.0
40
+ cfgv==3.4.0
41
+ charset-normalizer==3.3.2
42
+ click-didyoumean==0.3.1
43
+ click-plugins==1.1.1
44
+ click-repl==0.3.0
45
+ click==8.1.7
46
+ cloudpickle==3.0.0
47
+ cmake==3.30.1
48
+ colorama==0.4.6
49
+ comm==0.2.2
50
+ commonmark==0.9.1
51
+ configobj==5.0.8
52
+ contourpy==1.2.1
53
+ cryptography==43.0.0
54
+ cycler==0.12.1
55
+ dacite==1.6.0
56
+ dagshub-annotation-converter==0.1.0
57
+ dagshub==0.3.35
58
+ dataclasses-json==0.6.7
59
+ datasets==2.20.0
60
+ debugpy==1.8.2
61
+ decorator==4.4.2
62
+ deepspeed==0.14.4
63
+ dictdiffer==0.9.0
64
+ diffusers==0.29.2
65
+ dill==0.3.8
66
+ diskcache==5.6.3
67
+ distlib==0.3.8
68
+ distro==1.9.0
69
+ dnspython==2.6.1
70
+ docker-pycreds==0.4.0
71
+ docstring_parser==0.16
72
+ dpath==2.2.0
73
+ dulwich==0.22.1
74
+ dvc-data==3.16.5
75
+ dvc-http==2.32.0
76
+ dvc-objects==5.1.0
77
+ dvc-render==1.0.2
78
+ dvc-studio-client==0.21.0
79
+ dvc-task==0.4.0
80
+ dvc==3.55.1
81
+ einops==0.8.0
82
+ email_validator==2.2.0
83
+ entrypoints==0.4
84
+ exceptiongroup==1.2.2
85
+ executing==2.0.1
86
+ fastapi-cli==0.0.4
87
+ fastapi==0.111.1
88
+ ffmpy==0.3.3
89
+ filelock==3.15.4
90
+ fire==0.6.0
91
+ flatten-dict==0.4.2
92
+ flufl.lock==8.1.0
93
+ fonttools==4.53.1
94
+ frozenlist==1.4.1
95
+ fsspec==2024.5.0
96
+ funcy==2.0
97
+ fusepy==3.0.1
98
+ gitdb==4.0.11
99
+ gmpy2==2.1.5
100
+ gql==3.5.0
101
+ gradio==4.39.0
102
+ gradio_client==1.1.1
103
+ gradio_multimodalchatbot==0.0.1
104
+ grandalf==0.8
105
+ grapheme==0.6.0
106
+ graphql-core==3.2.3
107
+ grpcio==1.65.1
108
+ gto==1.7.1
109
+ h11==0.14.0
110
+ h2==4.1.0
111
+ hjson==3.1.0
112
+ hpack==4.0.0
113
+ httpcore==1.0.5
114
+ httptools==0.6.1
115
+ httpx==0.27.2
116
+ huggingface-hub==0.24.3
117
+ hydra-core==1.3.2
118
+ hyperframe==6.0.1
119
+ identify==2.6.0
120
+ idna==3.7
121
+ imageio-ffmpeg==0.5.1
122
+ imageio==2.35.1
123
+ importlib_metadata==8.0.0
124
+ importlib_metadata==8.2.0
125
+ importlib_resources==6.4.0
126
+ importlib_resources==6.4.0
127
+ inflect==7.3.1
128
+ iniconfig==2.0.0
129
+ interegular==0.3.3
130
+ ipykernel==6.29.5
131
+ ipython==8.26.0
132
+ iterative-telemetry==0.0.8
133
+ jaraco.context==5.3.0
134
+ jaraco.functools==4.0.1
135
+ jaraco.text==3.12.1
136
+ jedi==0.19.1
137
+ jmespath==1.0.1
138
+ joblib==1.4.2
139
+ jsonschema-specifications==2023.12.1
140
+ jsonschema==4.23.0
141
+ jupyter_client==8.6.2
142
+ jupyter_core==5.7.2
143
+ kiwisolver==1.4.5
144
+ kombu==5.4.0
145
+ lark==1.1.9
146
+ lazy_loader==0.4
147
+ librosa==0.10.2.post1
148
+ llamafactory==0.8.4.dev0
149
+ llamafactory==0.8.4.dev0
150
+ llvmlite==0.43.0
151
+ lm-format-enforcer==0.10.3
152
+ lxml==5.3.0
153
+ markdown-it-py==3.0.0
154
+ marshmallow==3.22.0
155
+ matplotlib-inline==0.1.7
156
+ matplotlib==3.9.1
157
+ mdurl==0.1.2
158
+ mmsg==0.1.dev14+gbd2b056.d20240803
159
+ more-itertools==10.3.0
160
+ moviepy==1.0.3
161
+ mpi4py==4.0.0
162
+ mpmath==1.3.0
163
+ msgpack==1.0.8
164
+ multidict==6.0.5
165
+ multiprocess==0.70.16
166
+ mypy-extensions==1.0.0
167
+ nest_asyncio==1.6.0
168
+ networkx==3.3
169
+ ninja==1.11.1.1
170
+ nodeenv==1.9.1
171
+ numba==0.60.0
172
+ numpy==1.26.4
173
+ nvidia-cublas-cu12==12.1.3.1
174
+ nvidia-cuda-cupti-cu12==12.1.105
175
+ nvidia-cuda-nvrtc-cu12==12.1.105
176
+ nvidia-cuda-runtime-cu12==12.1.105
177
+ nvidia-cudnn-cu12==8.9.2.26
178
+ nvidia-cufft-cu12==11.0.2.54
179
+ nvidia-curand-cu12==10.3.2.106
180
+ nvidia-cusolver-cu12==11.4.5.107
181
+ nvidia-cusparse-cu12==12.1.0.106
182
+ nvidia-ml-py==12.535.161
183
+ nvidia-nccl-cu12==2.20.5
184
+ nvidia-nvjitlink-cu12==12.5.82
185
+ nvidia-nvtx-cu12==12.1.105
186
+ nvitop==1.3.2
187
+ omegaconf==2.3.0
188
+ openai==1.37.1
189
+ optree==0.12.1
190
+ ordered-set==4.1.0
191
+ orjson==3.10.6
192
+ outlines==0.0.47.dev37+g26e2934
193
+ packaging==24.1
194
+ packaging==24.1
195
+ pandas==2.2.2
196
+ parso==0.8.4
197
+ pathspec==0.12.1
198
+ pathvalidate==3.0.0
199
+ peft==0.12.0
200
+ pexpect==4.9.0
201
+ pickleshare==0.7.5
202
+ pillow==10.4.0
203
+ pip==24.0
204
+ platformdirs==3.11.0
205
+ platformdirs==4.2.2
206
+ pluggy==1.5.0
207
+ pooch==1.8.2
208
+ pre-commit==3.8.0
209
+ proglog==0.1.10
210
+ prometheus-fastapi-instrumentator==7.0.0
211
+ prometheus_client==0.20.0
212
+ prompt_toolkit==3.0.47
213
+ protobuf==4.25.4
214
+ psutil==6.0.0
215
+ ptyprocess==0.7.0
216
+ pure_eval==0.2.3
217
+ py-cpuinfo==9.0.0
218
+ pyairports==2.1.1
219
+ pyarrow-hotfix==0.6
220
+ pyarrow==17.0.0
221
+ pyav==13.0.0
222
+ pycountry==24.6.1
223
+ pycparser==2.22
224
+ pydantic==2.8.2
225
+ pydantic_core==2.20.1
226
+ pydot==3.0.1
227
+ pydub==0.25.1
228
+ pygit2==1.15.1
229
+ pygtrie==2.5.0
230
+ pyparsing==3.1.2
231
+ pytest==8.3.2
232
+ python-dateutil==2.9.0
233
+ python-dateutil==2.9.0.post0
234
+ python-dotenv==1.0.1
235
+ python-multipart==0.0.9
236
+ pytz==2024.1
237
+ pyzmq==26.0.3
238
+ ranger-fm==1.9.3
239
+ ray==2.34.0
240
+ referencing==0.35.1
241
+ regex==2024.7.24
242
+ requests-toolbelt==1.0.0
243
+ requests==2.32.3
244
+ rfc3986==1.5.0
245
+ rich==13.1.0
246
+ rpds-py==0.19.1
247
+ ruamel.yaml.clib==0.2.8
248
+ ruamel.yaml==0.18.6
249
+ ruff==0.5.5
250
+ s3transfer==0.10.2
251
+ safetensors==0.4.3
252
+ scikit-learn==1.5.1
253
+ scipy==1.14.0
254
+ scmrepo==3.3.7
255
+ semantic-version==2.10.0
256
+ semver==3.0.2
257
+ sentencepiece==0.2.0
258
+ sentry-sdk==2.11.0
259
+ setproctitle==1.3.3
260
+ setuptools==71.0.4
261
+ shellingham==1.5.4
262
+ shortuuid==1.0.13
263
+ shtab==1.7.1
264
+ six==1.16.0
265
+ smmap==5.0.1
266
+ sniffio==1.3.1
267
+ soundfile==0.12.1
268
+ soxr==0.4.0
269
+ sqltrie==0.11.1
270
+ sse-starlette==2.1.3
271
+ stack-data==0.6.2
272
+ starlette==0.37.2
273
+ sympy==1.13.0
274
+ tabulate==0.9.0
275
+ tenacity==8.2.3
276
+ tensorboard-data-server==0.7.2
277
+ tensorboard==2.17.0
278
+ term-image==0.7.2
279
+ termcolor==2.4.0
280
+ threadpoolctl==3.5.0
281
+ tiktoken==0.7.0
282
+ tokenizers==0.19.1
283
+ tomli==2.0.1
284
+ tomlkit==0.12.0
285
+ torch==2.3.1
286
+ torch==2.4.0
287
+ torchaudio==2.4.0
288
+ torchvision==0.18.1
289
+ torchvision==0.19.0
290
+ tornado==6.4.1
291
+ tqdm==4.66.4
292
+ traitlets==5.14.3
293
+ transformers==4.45.0.dev0
294
+ treelib==1.6.4
295
+ triton==2.3.1
296
+ triton==3.0.0
297
+ trl==0.9.6
298
+ typeguard==4.3.0
299
+ typer==0.12.3
300
+ typing-inspect==0.9.0
301
+ typing_extensions==4.12.2
302
+ typing_extensions==4.12.2
303
+ tyro==0.8.10
304
+ tzdata==2024.1
305
+ urllib3==2.2.2
306
+ uvicorn==0.30.3
307
+ uvloop==0.19.0
308
+ vine==5.1.0
309
+ virtualenv==20.26.3
310
+ vllm-flash-attn==2.5.9.post1
311
+ vllm==0.5.3.post1
312
+ voluptuous==0.15.2
313
+ wandb==0.17.5
314
+ watchfiles==0.22.0
315
+ wcwidth==0.2.13
316
+ websockets==11.0.3
317
+ wheel==0.43.0
318
+ wheel==0.43.0
319
+ xformers==0.0.27
320
+ xxhash==3.4.1
321
+ yarl==1.9.4
322
+ zc.lockfile==3.0.post1
323
+ zipp==3.19.2
324
+ zipp==3.19.2
325
+ zstandard==0.23.0
wandb/run-20240921_111222-4ony16ec/files/wandb-metadata.json ADDED
@@ -0,0 +1,1215 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "os": "Linux-5.15.0-1040-nvidia-x86_64-with-glibc2.35",
3
+ "python": "3.11.9",
4
+ "heartbeatAt": "2024-09-21T03:12:23.935425",
5
+ "startedAt": "2024-09-21T03:12:22.874534",
6
+ "docker": null,
7
+ "cuda": null,
8
+ "args": [
9
+ "--local_rank=0",
10
+ "--model_name_or_path",
11
+ "/aifs4su/yaodong/models/Qwen2-VL-7B-Instruct",
12
+ "--train_datasets",
13
+ "/aifs4su/yaodong/datasets/aaa_dataset/TV2T-preference/extracted",
14
+ "--output_dir",
15
+ "../outputs/dpo_tiv2t_1.5k_base",
16
+ "--train_data_files",
17
+ "1.5k_clean_duplicate.json",
18
+ "--train_template",
19
+ "NExTQA_preference",
20
+ "--train_split",
21
+ "train",
22
+ "--per_device_train_batch_size",
23
+ "1",
24
+ "--per_device_eval_batch_size",
25
+ "1",
26
+ "--gradient_accumulation_steps",
27
+ "1"
28
+ ],
29
+ "state": "running",
30
+ "program": "-m align_anything.trainers.tiv_to_t.dpo",
31
+ "codePathLocal": null,
32
+ "git": {
33
+ "remote": "git@github.com-hantao:htlou/align-anything.git",
34
+ "commit": "9eff99b0ee34f7265b8a2e1824650634c898f654"
35
+ },
36
+ "email": "2200017789@stu.pku.edu.cn",
37
+ "root": "/aifs4su/yaodong/projects/hantao/dev_cham/align-anything",
38
+ "host": "dgx-119",
39
+ "username": "yangyaodong",
40
+ "executable": "/aifs4su/yaodong/miniconda3/envs/hantao_tiv/bin/python3.11",
41
+ "cpu_count": 112,
42
+ "cpu_count_logical": 224,
43
+ "cpu_freq": {
44
+ "current": 2064.1573660714284,
45
+ "min": 800.0,
46
+ "max": 3800.0
47
+ },
48
+ "cpu_freq_per_core": [
49
+ {
50
+ "current": 2000.0,
51
+ "min": 800.0,
52
+ "max": 3800.0
53
+ },
54
+ {
55
+ "current": 2000.0,
56
+ "min": 800.0,
57
+ "max": 3800.0
58
+ },
59
+ {
60
+ "current": 2000.0,
61
+ "min": 800.0,
62
+ "max": 3800.0
63
+ },
64
+ {
65
+ "current": 3799.996,
66
+ "min": 800.0,
67
+ "max": 3800.0
68
+ },
69
+ {
70
+ "current": 2000.0,
71
+ "min": 800.0,
72
+ "max": 3800.0
73
+ },
74
+ {
75
+ "current": 2000.0,
76
+ "min": 800.0,
77
+ "max": 3800.0
78
+ },
79
+ {
80
+ "current": 2000.0,
81
+ "min": 800.0,
82
+ "max": 3800.0
83
+ },
84
+ {
85
+ "current": 2000.0,
86
+ "min": 800.0,
87
+ "max": 3800.0
88
+ },
89
+ {
90
+ "current": 2000.0,
91
+ "min": 800.0,
92
+ "max": 3800.0
93
+ },
94
+ {
95
+ "current": 2000.0,
96
+ "min": 800.0,
97
+ "max": 3800.0
98
+ },
99
+ {
100
+ "current": 2000.0,
101
+ "min": 800.0,
102
+ "max": 3800.0
103
+ },
104
+ {
105
+ "current": 2000.0,
106
+ "min": 800.0,
107
+ "max": 3800.0
108
+ },
109
+ {
110
+ "current": 2000.0,
111
+ "min": 800.0,
112
+ "max": 3800.0
113
+ },
114
+ {
115
+ "current": 2000.0,
116
+ "min": 800.0,
117
+ "max": 3800.0
118
+ },
119
+ {
120
+ "current": 2000.0,
121
+ "min": 800.0,
122
+ "max": 3800.0
123
+ },
124
+ {
125
+ "current": 2000.0,
126
+ "min": 800.0,
127
+ "max": 3800.0
128
+ },
129
+ {
130
+ "current": 3800.0,
131
+ "min": 800.0,
132
+ "max": 3800.0
133
+ },
134
+ {
135
+ "current": 2000.0,
136
+ "min": 800.0,
137
+ "max": 3800.0
138
+ },
139
+ {
140
+ "current": 2000.0,
141
+ "min": 800.0,
142
+ "max": 3800.0
143
+ },
144
+ {
145
+ "current": 2000.0,
146
+ "min": 800.0,
147
+ "max": 3800.0
148
+ },
149
+ {
150
+ "current": 2000.0,
151
+ "min": 800.0,
152
+ "max": 3800.0
153
+ },
154
+ {
155
+ "current": 2000.0,
156
+ "min": 800.0,
157
+ "max": 3800.0
158
+ },
159
+ {
160
+ "current": 2000.0,
161
+ "min": 800.0,
162
+ "max": 3800.0
163
+ },
164
+ {
165
+ "current": 2000.0,
166
+ "min": 800.0,
167
+ "max": 3800.0
168
+ },
169
+ {
170
+ "current": 2000.0,
171
+ "min": 800.0,
172
+ "max": 3800.0
173
+ },
174
+ {
175
+ "current": 2000.0,
176
+ "min": 800.0,
177
+ "max": 3800.0
178
+ },
179
+ {
180
+ "current": 2000.0,
181
+ "min": 800.0,
182
+ "max": 3800.0
183
+ },
184
+ {
185
+ "current": 2000.0,
186
+ "min": 800.0,
187
+ "max": 3800.0
188
+ },
189
+ {
190
+ "current": 2000.0,
191
+ "min": 800.0,
192
+ "max": 3800.0
193
+ },
194
+ {
195
+ "current": 2000.0,
196
+ "min": 800.0,
197
+ "max": 3800.0
198
+ },
199
+ {
200
+ "current": 2000.0,
201
+ "min": 800.0,
202
+ "max": 3800.0
203
+ },
204
+ {
205
+ "current": 2000.0,
206
+ "min": 800.0,
207
+ "max": 3800.0
208
+ },
209
+ {
210
+ "current": 2000.0,
211
+ "min": 800.0,
212
+ "max": 3800.0
213
+ },
214
+ {
215
+ "current": 2000.0,
216
+ "min": 800.0,
217
+ "max": 3800.0
218
+ },
219
+ {
220
+ "current": 2000.0,
221
+ "min": 800.0,
222
+ "max": 3800.0
223
+ },
224
+ {
225
+ "current": 2000.0,
226
+ "min": 800.0,
227
+ "max": 3800.0
228
+ },
229
+ {
230
+ "current": 2000.0,
231
+ "min": 800.0,
232
+ "max": 3800.0
233
+ },
234
+ {
235
+ "current": 2000.0,
236
+ "min": 800.0,
237
+ "max": 3800.0
238
+ },
239
+ {
240
+ "current": 2000.0,
241
+ "min": 800.0,
242
+ "max": 3800.0
243
+ },
244
+ {
245
+ "current": 2000.0,
246
+ "min": 800.0,
247
+ "max": 3800.0
248
+ },
249
+ {
250
+ "current": 2000.0,
251
+ "min": 800.0,
252
+ "max": 3800.0
253
+ },
254
+ {
255
+ "current": 2000.0,
256
+ "min": 800.0,
257
+ "max": 3800.0
258
+ },
259
+ {
260
+ "current": 2000.0,
261
+ "min": 800.0,
262
+ "max": 3800.0
263
+ },
264
+ {
265
+ "current": 2000.0,
266
+ "min": 800.0,
267
+ "max": 3800.0
268
+ },
269
+ {
270
+ "current": 2000.0,
271
+ "min": 800.0,
272
+ "max": 3800.0
273
+ },
274
+ {
275
+ "current": 2000.0,
276
+ "min": 800.0,
277
+ "max": 3800.0
278
+ },
279
+ {
280
+ "current": 2000.0,
281
+ "min": 800.0,
282
+ "max": 3800.0
283
+ },
284
+ {
285
+ "current": 2000.0,
286
+ "min": 800.0,
287
+ "max": 3800.0
288
+ },
289
+ {
290
+ "current": 2000.0,
291
+ "min": 800.0,
292
+ "max": 3800.0
293
+ },
294
+ {
295
+ "current": 2000.0,
296
+ "min": 800.0,
297
+ "max": 3800.0
298
+ },
299
+ {
300
+ "current": 2000.0,
301
+ "min": 800.0,
302
+ "max": 3800.0
303
+ },
304
+ {
305
+ "current": 2000.0,
306
+ "min": 800.0,
307
+ "max": 3800.0
308
+ },
309
+ {
310
+ "current": 2000.0,
311
+ "min": 800.0,
312
+ "max": 3800.0
313
+ },
314
+ {
315
+ "current": 2000.0,
316
+ "min": 800.0,
317
+ "max": 3800.0
318
+ },
319
+ {
320
+ "current": 2000.0,
321
+ "min": 800.0,
322
+ "max": 3800.0
323
+ },
324
+ {
325
+ "current": 2000.0,
326
+ "min": 800.0,
327
+ "max": 3800.0
328
+ },
329
+ {
330
+ "current": 2000.0,
331
+ "min": 800.0,
332
+ "max": 3800.0
333
+ },
334
+ {
335
+ "current": 2000.0,
336
+ "min": 800.0,
337
+ "max": 3800.0
338
+ },
339
+ {
340
+ "current": 2000.0,
341
+ "min": 800.0,
342
+ "max": 3800.0
343
+ },
344
+ {
345
+ "current": 2000.0,
346
+ "min": 800.0,
347
+ "max": 3800.0
348
+ },
349
+ {
350
+ "current": 3800.003,
351
+ "min": 800.0,
352
+ "max": 3800.0
353
+ },
354
+ {
355
+ "current": 2000.0,
356
+ "min": 800.0,
357
+ "max": 3800.0
358
+ },
359
+ {
360
+ "current": 2000.0,
361
+ "min": 800.0,
362
+ "max": 3800.0
363
+ },
364
+ {
365
+ "current": 3800.003,
366
+ "min": 800.0,
367
+ "max": 3800.0
368
+ },
369
+ {
370
+ "current": 2000.0,
371
+ "min": 800.0,
372
+ "max": 3800.0
373
+ },
374
+ {
375
+ "current": 3800.003,
376
+ "min": 800.0,
377
+ "max": 3800.0
378
+ },
379
+ {
380
+ "current": 2000.0,
381
+ "min": 800.0,
382
+ "max": 3800.0
383
+ },
384
+ {
385
+ "current": 2000.0,
386
+ "min": 800.0,
387
+ "max": 3800.0
388
+ },
389
+ {
390
+ "current": 2000.0,
391
+ "min": 800.0,
392
+ "max": 3800.0
393
+ },
394
+ {
395
+ "current": 2000.0,
396
+ "min": 800.0,
397
+ "max": 3800.0
398
+ },
399
+ {
400
+ "current": 2000.0,
401
+ "min": 800.0,
402
+ "max": 3800.0
403
+ },
404
+ {
405
+ "current": 2000.0,
406
+ "min": 800.0,
407
+ "max": 3800.0
408
+ },
409
+ {
410
+ "current": 2000.0,
411
+ "min": 800.0,
412
+ "max": 3800.0
413
+ },
414
+ {
415
+ "current": 2000.0,
416
+ "min": 800.0,
417
+ "max": 3800.0
418
+ },
419
+ {
420
+ "current": 2000.0,
421
+ "min": 800.0,
422
+ "max": 3800.0
423
+ },
424
+ {
425
+ "current": 2000.0,
426
+ "min": 800.0,
427
+ "max": 3800.0
428
+ },
429
+ {
430
+ "current": 2000.0,
431
+ "min": 800.0,
432
+ "max": 3800.0
433
+ },
434
+ {
435
+ "current": 2000.0,
436
+ "min": 800.0,
437
+ "max": 3800.0
438
+ },
439
+ {
440
+ "current": 2000.0,
441
+ "min": 800.0,
442
+ "max": 3800.0
443
+ },
444
+ {
445
+ "current": 2000.0,
446
+ "min": 800.0,
447
+ "max": 3800.0
448
+ },
449
+ {
450
+ "current": 2000.0,
451
+ "min": 800.0,
452
+ "max": 3800.0
453
+ },
454
+ {
455
+ "current": 2000.0,
456
+ "min": 800.0,
457
+ "max": 3800.0
458
+ },
459
+ {
460
+ "current": 2000.0,
461
+ "min": 800.0,
462
+ "max": 3800.0
463
+ },
464
+ {
465
+ "current": 2000.0,
466
+ "min": 800.0,
467
+ "max": 3800.0
468
+ },
469
+ {
470
+ "current": 2000.0,
471
+ "min": 800.0,
472
+ "max": 3800.0
473
+ },
474
+ {
475
+ "current": 2000.0,
476
+ "min": 800.0,
477
+ "max": 3800.0
478
+ },
479
+ {
480
+ "current": 2000.0,
481
+ "min": 800.0,
482
+ "max": 3800.0
483
+ },
484
+ {
485
+ "current": 2000.0,
486
+ "min": 800.0,
487
+ "max": 3800.0
488
+ },
489
+ {
490
+ "current": 2000.0,
491
+ "min": 800.0,
492
+ "max": 3800.0
493
+ },
494
+ {
495
+ "current": 2000.0,
496
+ "min": 800.0,
497
+ "max": 3800.0
498
+ },
499
+ {
500
+ "current": 2000.0,
501
+ "min": 800.0,
502
+ "max": 3800.0
503
+ },
504
+ {
505
+ "current": 2000.0,
506
+ "min": 800.0,
507
+ "max": 3800.0
508
+ },
509
+ {
510
+ "current": 2000.0,
511
+ "min": 800.0,
512
+ "max": 3800.0
513
+ },
514
+ {
515
+ "current": 2000.0,
516
+ "min": 800.0,
517
+ "max": 3800.0
518
+ },
519
+ {
520
+ "current": 2000.0,
521
+ "min": 800.0,
522
+ "max": 3800.0
523
+ },
524
+ {
525
+ "current": 2000.0,
526
+ "min": 800.0,
527
+ "max": 3800.0
528
+ },
529
+ {
530
+ "current": 2000.0,
531
+ "min": 800.0,
532
+ "max": 3800.0
533
+ },
534
+ {
535
+ "current": 2000.0,
536
+ "min": 800.0,
537
+ "max": 3800.0
538
+ },
539
+ {
540
+ "current": 2000.0,
541
+ "min": 800.0,
542
+ "max": 3800.0
543
+ },
544
+ {
545
+ "current": 3800.0,
546
+ "min": 800.0,
547
+ "max": 3800.0
548
+ },
549
+ {
550
+ "current": 2000.0,
551
+ "min": 800.0,
552
+ "max": 3800.0
553
+ },
554
+ {
555
+ "current": 2000.0,
556
+ "min": 800.0,
557
+ "max": 3800.0
558
+ },
559
+ {
560
+ "current": 2000.0,
561
+ "min": 800.0,
562
+ "max": 3800.0
563
+ },
564
+ {
565
+ "current": 2000.0,
566
+ "min": 800.0,
567
+ "max": 3800.0
568
+ },
569
+ {
570
+ "current": 2000.0,
571
+ "min": 800.0,
572
+ "max": 3800.0
573
+ },
574
+ {
575
+ "current": 2000.0,
576
+ "min": 800.0,
577
+ "max": 3800.0
578
+ },
579
+ {
580
+ "current": 2000.0,
581
+ "min": 800.0,
582
+ "max": 3800.0
583
+ },
584
+ {
585
+ "current": 2000.0,
586
+ "min": 800.0,
587
+ "max": 3800.0
588
+ },
589
+ {
590
+ "current": 2000.0,
591
+ "min": 800.0,
592
+ "max": 3800.0
593
+ },
594
+ {
595
+ "current": 2000.0,
596
+ "min": 800.0,
597
+ "max": 3800.0
598
+ },
599
+ {
600
+ "current": 2000.0,
601
+ "min": 800.0,
602
+ "max": 3800.0
603
+ },
604
+ {
605
+ "current": 2000.0,
606
+ "min": 800.0,
607
+ "max": 3800.0
608
+ },
609
+ {
610
+ "current": 2000.0,
611
+ "min": 800.0,
612
+ "max": 3800.0
613
+ },
614
+ {
615
+ "current": 2000.0,
616
+ "min": 800.0,
617
+ "max": 3800.0
618
+ },
619
+ {
620
+ "current": 2000.0,
621
+ "min": 800.0,
622
+ "max": 3800.0
623
+ },
624
+ {
625
+ "current": 2000.0,
626
+ "min": 800.0,
627
+ "max": 3800.0
628
+ },
629
+ {
630
+ "current": 2000.0,
631
+ "min": 800.0,
632
+ "max": 3800.0
633
+ },
634
+ {
635
+ "current": 2000.0,
636
+ "min": 800.0,
637
+ "max": 3800.0
638
+ },
639
+ {
640
+ "current": 2000.0,
641
+ "min": 800.0,
642
+ "max": 3800.0
643
+ },
644
+ {
645
+ "current": 2000.0,
646
+ "min": 800.0,
647
+ "max": 3800.0
648
+ },
649
+ {
650
+ "current": 2000.0,
651
+ "min": 800.0,
652
+ "max": 3800.0
653
+ },
654
+ {
655
+ "current": 2000.0,
656
+ "min": 800.0,
657
+ "max": 3800.0
658
+ },
659
+ {
660
+ "current": 2000.0,
661
+ "min": 800.0,
662
+ "max": 3800.0
663
+ },
664
+ {
665
+ "current": 2000.0,
666
+ "min": 800.0,
667
+ "max": 3800.0
668
+ },
669
+ {
670
+ "current": 2000.0,
671
+ "min": 800.0,
672
+ "max": 3800.0
673
+ },
674
+ {
675
+ "current": 2000.0,
676
+ "min": 800.0,
677
+ "max": 3800.0
678
+ },
679
+ {
680
+ "current": 2000.0,
681
+ "min": 800.0,
682
+ "max": 3800.0
683
+ },
684
+ {
685
+ "current": 2000.0,
686
+ "min": 800.0,
687
+ "max": 3800.0
688
+ },
689
+ {
690
+ "current": 2000.0,
691
+ "min": 800.0,
692
+ "max": 3800.0
693
+ },
694
+ {
695
+ "current": 2000.0,
696
+ "min": 800.0,
697
+ "max": 3800.0
698
+ },
699
+ {
700
+ "current": 2000.0,
701
+ "min": 800.0,
702
+ "max": 3800.0
703
+ },
704
+ {
705
+ "current": 2000.0,
706
+ "min": 800.0,
707
+ "max": 3800.0
708
+ },
709
+ {
710
+ "current": 2000.0,
711
+ "min": 800.0,
712
+ "max": 3800.0
713
+ },
714
+ {
715
+ "current": 2000.0,
716
+ "min": 800.0,
717
+ "max": 3800.0
718
+ },
719
+ {
720
+ "current": 2000.0,
721
+ "min": 800.0,
722
+ "max": 3800.0
723
+ },
724
+ {
725
+ "current": 2000.0,
726
+ "min": 800.0,
727
+ "max": 3800.0
728
+ },
729
+ {
730
+ "current": 2000.0,
731
+ "min": 800.0,
732
+ "max": 3800.0
733
+ },
734
+ {
735
+ "current": 2000.0,
736
+ "min": 800.0,
737
+ "max": 3800.0
738
+ },
739
+ {
740
+ "current": 2000.0,
741
+ "min": 800.0,
742
+ "max": 3800.0
743
+ },
744
+ {
745
+ "current": 2000.0,
746
+ "min": 800.0,
747
+ "max": 3800.0
748
+ },
749
+ {
750
+ "current": 2000.0,
751
+ "min": 800.0,
752
+ "max": 3800.0
753
+ },
754
+ {
755
+ "current": 2000.0,
756
+ "min": 800.0,
757
+ "max": 3800.0
758
+ },
759
+ {
760
+ "current": 2000.0,
761
+ "min": 800.0,
762
+ "max": 3800.0
763
+ },
764
+ {
765
+ "current": 2000.0,
766
+ "min": 800.0,
767
+ "max": 3800.0
768
+ },
769
+ {
770
+ "current": 2000.0,
771
+ "min": 800.0,
772
+ "max": 3800.0
773
+ },
774
+ {
775
+ "current": 2000.0,
776
+ "min": 800.0,
777
+ "max": 3800.0
778
+ },
779
+ {
780
+ "current": 2000.0,
781
+ "min": 800.0,
782
+ "max": 3800.0
783
+ },
784
+ {
785
+ "current": 2000.0,
786
+ "min": 800.0,
787
+ "max": 3800.0
788
+ },
789
+ {
790
+ "current": 2000.0,
791
+ "min": 800.0,
792
+ "max": 3800.0
793
+ },
794
+ {
795
+ "current": 2000.0,
796
+ "min": 800.0,
797
+ "max": 3800.0
798
+ },
799
+ {
800
+ "current": 2000.0,
801
+ "min": 800.0,
802
+ "max": 3800.0
803
+ },
804
+ {
805
+ "current": 2000.0,
806
+ "min": 800.0,
807
+ "max": 3800.0
808
+ },
809
+ {
810
+ "current": 2000.0,
811
+ "min": 800.0,
812
+ "max": 3800.0
813
+ },
814
+ {
815
+ "current": 2000.0,
816
+ "min": 800.0,
817
+ "max": 3800.0
818
+ },
819
+ {
820
+ "current": 2000.0,
821
+ "min": 800.0,
822
+ "max": 3800.0
823
+ },
824
+ {
825
+ "current": 2000.0,
826
+ "min": 800.0,
827
+ "max": 3800.0
828
+ },
829
+ {
830
+ "current": 2000.0,
831
+ "min": 800.0,
832
+ "max": 3800.0
833
+ },
834
+ {
835
+ "current": 2000.0,
836
+ "min": 800.0,
837
+ "max": 3800.0
838
+ },
839
+ {
840
+ "current": 2000.0,
841
+ "min": 800.0,
842
+ "max": 3800.0
843
+ },
844
+ {
845
+ "current": 2000.0,
846
+ "min": 800.0,
847
+ "max": 3800.0
848
+ },
849
+ {
850
+ "current": 2000.0,
851
+ "min": 800.0,
852
+ "max": 3800.0
853
+ },
854
+ {
855
+ "current": 2000.0,
856
+ "min": 800.0,
857
+ "max": 3800.0
858
+ },
859
+ {
860
+ "current": 2000.0,
861
+ "min": 800.0,
862
+ "max": 3800.0
863
+ },
864
+ {
865
+ "current": 2000.0,
866
+ "min": 800.0,
867
+ "max": 3800.0
868
+ },
869
+ {
870
+ "current": 2000.0,
871
+ "min": 800.0,
872
+ "max": 3800.0
873
+ },
874
+ {
875
+ "current": 2000.0,
876
+ "min": 800.0,
877
+ "max": 3800.0
878
+ },
879
+ {
880
+ "current": 2000.0,
881
+ "min": 800.0,
882
+ "max": 3800.0
883
+ },
884
+ {
885
+ "current": 2000.0,
886
+ "min": 800.0,
887
+ "max": 3800.0
888
+ },
889
+ {
890
+ "current": 3800.0,
891
+ "min": 800.0,
892
+ "max": 3800.0
893
+ },
894
+ {
895
+ "current": 2000.0,
896
+ "min": 800.0,
897
+ "max": 3800.0
898
+ },
899
+ {
900
+ "current": 2000.0,
901
+ "min": 800.0,
902
+ "max": 3800.0
903
+ },
904
+ {
905
+ "current": 3800.0,
906
+ "min": 800.0,
907
+ "max": 3800.0
908
+ },
909
+ {
910
+ "current": 2000.0,
911
+ "min": 800.0,
912
+ "max": 3800.0
913
+ },
914
+ {
915
+ "current": 2000.0,
916
+ "min": 800.0,
917
+ "max": 3800.0
918
+ },
919
+ {
920
+ "current": 2000.0,
921
+ "min": 800.0,
922
+ "max": 3800.0
923
+ },
924
+ {
925
+ "current": 2000.0,
926
+ "min": 800.0,
927
+ "max": 3800.0
928
+ },
929
+ {
930
+ "current": 2000.0,
931
+ "min": 800.0,
932
+ "max": 3800.0
933
+ },
934
+ {
935
+ "current": 2000.0,
936
+ "min": 800.0,
937
+ "max": 3800.0
938
+ },
939
+ {
940
+ "current": 2000.0,
941
+ "min": 800.0,
942
+ "max": 3800.0
943
+ },
944
+ {
945
+ "current": 2000.0,
946
+ "min": 800.0,
947
+ "max": 3800.0
948
+ },
949
+ {
950
+ "current": 2000.0,
951
+ "min": 800.0,
952
+ "max": 3800.0
953
+ },
954
+ {
955
+ "current": 2000.0,
956
+ "min": 800.0,
957
+ "max": 3800.0
958
+ },
959
+ {
960
+ "current": 2000.0,
961
+ "min": 800.0,
962
+ "max": 3800.0
963
+ },
964
+ {
965
+ "current": 2000.0,
966
+ "min": 800.0,
967
+ "max": 3800.0
968
+ },
969
+ {
970
+ "current": 2000.0,
971
+ "min": 800.0,
972
+ "max": 3800.0
973
+ },
974
+ {
975
+ "current": 2000.0,
976
+ "min": 800.0,
977
+ "max": 3800.0
978
+ },
979
+ {
980
+ "current": 2000.0,
981
+ "min": 800.0,
982
+ "max": 3800.0
983
+ },
984
+ {
985
+ "current": 2000.0,
986
+ "min": 800.0,
987
+ "max": 3800.0
988
+ },
989
+ {
990
+ "current": 2000.0,
991
+ "min": 800.0,
992
+ "max": 3800.0
993
+ },
994
+ {
995
+ "current": 2000.0,
996
+ "min": 800.0,
997
+ "max": 3800.0
998
+ },
999
+ {
1000
+ "current": 2000.0,
1001
+ "min": 800.0,
1002
+ "max": 3800.0
1003
+ },
1004
+ {
1005
+ "current": 2000.0,
1006
+ "min": 800.0,
1007
+ "max": 3800.0
1008
+ },
1009
+ {
1010
+ "current": 2000.0,
1011
+ "min": 800.0,
1012
+ "max": 3800.0
1013
+ },
1014
+ {
1015
+ "current": 2000.0,
1016
+ "min": 800.0,
1017
+ "max": 3800.0
1018
+ },
1019
+ {
1020
+ "current": 2000.0,
1021
+ "min": 800.0,
1022
+ "max": 3800.0
1023
+ },
1024
+ {
1025
+ "current": 2000.0,
1026
+ "min": 800.0,
1027
+ "max": 3800.0
1028
+ },
1029
+ {
1030
+ "current": 2000.0,
1031
+ "min": 800.0,
1032
+ "max": 3800.0
1033
+ },
1034
+ {
1035
+ "current": 2000.0,
1036
+ "min": 800.0,
1037
+ "max": 3800.0
1038
+ },
1039
+ {
1040
+ "current": 2000.0,
1041
+ "min": 800.0,
1042
+ "max": 3800.0
1043
+ },
1044
+ {
1045
+ "current": 2000.0,
1046
+ "min": 800.0,
1047
+ "max": 3800.0
1048
+ },
1049
+ {
1050
+ "current": 2000.0,
1051
+ "min": 800.0,
1052
+ "max": 3800.0
1053
+ },
1054
+ {
1055
+ "current": 2000.0,
1056
+ "min": 800.0,
1057
+ "max": 3800.0
1058
+ },
1059
+ {
1060
+ "current": 2000.0,
1061
+ "min": 800.0,
1062
+ "max": 3800.0
1063
+ },
1064
+ {
1065
+ "current": 2000.0,
1066
+ "min": 800.0,
1067
+ "max": 3800.0
1068
+ },
1069
+ {
1070
+ "current": 2000.0,
1071
+ "min": 800.0,
1072
+ "max": 3800.0
1073
+ },
1074
+ {
1075
+ "current": 2000.0,
1076
+ "min": 800.0,
1077
+ "max": 3800.0
1078
+ },
1079
+ {
1080
+ "current": 2000.0,
1081
+ "min": 800.0,
1082
+ "max": 3800.0
1083
+ },
1084
+ {
1085
+ "current": 2000.0,
1086
+ "min": 800.0,
1087
+ "max": 3800.0
1088
+ },
1089
+ {
1090
+ "current": 2000.0,
1091
+ "min": 800.0,
1092
+ "max": 3800.0
1093
+ },
1094
+ {
1095
+ "current": 2000.0,
1096
+ "min": 800.0,
1097
+ "max": 3800.0
1098
+ },
1099
+ {
1100
+ "current": 2000.0,
1101
+ "min": 800.0,
1102
+ "max": 3800.0
1103
+ },
1104
+ {
1105
+ "current": 2000.0,
1106
+ "min": 800.0,
1107
+ "max": 3800.0
1108
+ },
1109
+ {
1110
+ "current": 2000.0,
1111
+ "min": 800.0,
1112
+ "max": 3800.0
1113
+ },
1114
+ {
1115
+ "current": 2000.0,
1116
+ "min": 800.0,
1117
+ "max": 3800.0
1118
+ },
1119
+ {
1120
+ "current": 2000.0,
1121
+ "min": 800.0,
1122
+ "max": 3800.0
1123
+ },
1124
+ {
1125
+ "current": 2000.0,
1126
+ "min": 800.0,
1127
+ "max": 3800.0
1128
+ },
1129
+ {
1130
+ "current": 2000.0,
1131
+ "min": 800.0,
1132
+ "max": 3800.0
1133
+ },
1134
+ {
1135
+ "current": 2000.0,
1136
+ "min": 800.0,
1137
+ "max": 3800.0
1138
+ },
1139
+ {
1140
+ "current": 2000.0,
1141
+ "min": 800.0,
1142
+ "max": 3800.0
1143
+ },
1144
+ {
1145
+ "current": 2000.0,
1146
+ "min": 800.0,
1147
+ "max": 3800.0
1148
+ },
1149
+ {
1150
+ "current": 2000.0,
1151
+ "min": 800.0,
1152
+ "max": 3800.0
1153
+ },
1154
+ {
1155
+ "current": 2000.0,
1156
+ "min": 800.0,
1157
+ "max": 3800.0
1158
+ },
1159
+ {
1160
+ "current": 2000.0,
1161
+ "min": 800.0,
1162
+ "max": 3800.0
1163
+ },
1164
+ {
1165
+ "current": 2000.0,
1166
+ "min": 800.0,
1167
+ "max": 3800.0
1168
+ }
1169
+ ],
1170
+ "disk": {
1171
+ "/": {
1172
+ "total": 1758.8549690246582,
1173
+ "used": 14.712554931640625
1174
+ }
1175
+ },
1176
+ "gpu": "NVIDIA H800",
1177
+ "gpu_count": 8,
1178
+ "gpu_devices": [
1179
+ {
1180
+ "name": "NVIDIA H800",
1181
+ "memory_total": 85520809984
1182
+ },
1183
+ {
1184
+ "name": "NVIDIA H800",
1185
+ "memory_total": 85520809984
1186
+ },
1187
+ {
1188
+ "name": "NVIDIA H800",
1189
+ "memory_total": 85520809984
1190
+ },
1191
+ {
1192
+ "name": "NVIDIA H800",
1193
+ "memory_total": 85520809984
1194
+ },
1195
+ {
1196
+ "name": "NVIDIA H800",
1197
+ "memory_total": 85520809984
1198
+ },
1199
+ {
1200
+ "name": "NVIDIA H800",
1201
+ "memory_total": 85520809984
1202
+ },
1203
+ {
1204
+ "name": "NVIDIA H800",
1205
+ "memory_total": 85520809984
1206
+ },
1207
+ {
1208
+ "name": "NVIDIA H800",
1209
+ "memory_total": 85520809984
1210
+ }
1211
+ ],
1212
+ "memory": {
1213
+ "total": 2015.5641632080078
1214
+ }
1215
+ }
wandb/run-20240921_111222-4ony16ec/files/wandb-summary.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"train/step": 531, "train/loss": 0.44282472133636475, "train/reward": -21.30280303955078, "train/better_sample_reward": -8.71082878112793, "train/worse_sample_reward": -12.591974258422852, "train/reward_accuracy": 0.875, "train/reward_margin": 3.8811450004577637, "train/lr": 0.0, "train/epoch": 3.0, "_timestamp": 1726892746.5268066, "_runtime": 4403.641909599304, "_step": 531, "_wandb": {"runtime": 4447}}
wandb/run-20240921_111222-4ony16ec/logs/debug-internal.log ADDED
The diff for this file is too large to render. See raw diff
 
wandb/run-20240921_111222-4ony16ec/logs/debug.log ADDED
@@ -0,0 +1,36 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2024-09-21 11:12:22,880 INFO MainThread:2809147 [wandb_setup.py:_flush():76] Current SDK version is 0.17.5
2
+ 2024-09-21 11:12:22,882 INFO MainThread:2809147 [wandb_setup.py:_flush():76] Configure stats pid to 2809147
3
+ 2024-09-21 11:12:22,882 INFO MainThread:2809147 [wandb_setup.py:_flush():76] Loading settings from /home/yangyaodong/.config/wandb/settings
4
+ 2024-09-21 11:12:22,882 INFO MainThread:2809147 [wandb_setup.py:_flush():76] Loading settings from /aifs4su/yaodong/projects/hantao/dev_cham/align-anything/scripts/wandb/settings
5
+ 2024-09-21 11:12:22,882 INFO MainThread:2809147 [wandb_setup.py:_flush():76] Loading settings from environment variables: {'api_key': '***REDACTED***'}
6
+ 2024-09-21 11:12:22,882 INFO MainThread:2809147 [wandb_setup.py:_flush():76] Applying setup settings: {'_disable_service': False}
7
+ 2024-09-21 11:12:22,882 WARNING MainThread:2809147 [wandb_setup.py:_flush():76] Could not find program at -m align_anything.trainers.tiv_to_t.dpo
8
+ 2024-09-21 11:12:22,882 INFO MainThread:2809147 [wandb_setup.py:_flush():76] Inferring run settings from compute environment: {'program_relpath': None, 'program': '-m align_anything.trainers.tiv_to_t.dpo'}
9
+ 2024-09-21 11:12:22,882 INFO MainThread:2809147 [wandb_setup.py:_flush():76] Applying login settings: {}
10
+ 2024-09-21 11:12:22,882 INFO MainThread:2809147 [wandb_init.py:_log_setup():529] Logging user logs to ../outputs/dpo_tiv2t_1.5k_base/wandb/run-20240921_111222-4ony16ec/logs/debug.log
11
+ 2024-09-21 11:12:22,882 INFO MainThread:2809147 [wandb_init.py:_log_setup():530] Logging internal logs to ../outputs/dpo_tiv2t_1.5k_base/wandb/run-20240921_111222-4ony16ec/logs/debug-internal.log
12
+ 2024-09-21 11:12:22,882 INFO MainThread:2809147 [wandb_init.py:init():569] calling init triggers
13
+ 2024-09-21 11:12:22,882 INFO MainThread:2809147 [wandb_init.py:init():576] wandb.init called with sweep_config: {}
14
+ config: {'train_cfgs': {'ds_cfgs': 'ds_z3_config.json', 'epochs': 3, 'seed': 42, 'per_device_train_batch_size': 1.0, 'per_device_eval_batch_size': 1.0, 'gradient_accumulation_steps': 1.0, 'gradient_checkpointing': True, 'learning_rate': 1e-06, 'lr_scheduler_type': 'cosine', 'lr_warmup_ratio': 0.01, 'weight_decay': 0.0, 'adam_betas': [0.9, 0.95], 'bf16': True, 'fp16': False, 'eval_strategy': 'epoch', 'eval_interval': 10, 'regularization': 0.001, 'scale_coeff': 0.1, 'freeze_mm_proj': False, 'freeze_vision_tower': True, 'freeze_language_model': False}, 'data_cfgs': {'train_datasets': '/aifs4su/yaodong/datasets/aaa_dataset/TV2T-preference/extracted', 'train_template': 'NExTQA_preference', 'train_size': None, 'train_split': 'train', 'train_subset': None, 'train_data_files': '1.5k_clean_duplicate.json', 'train_optional_args': [], 'eval_datasets': None, 'eval_template': None, 'eval_size': None, 'eval_split': None, 'eval_subset': None, 'eval_data_files': None, 'eval_optional_args': []}, 'logger_cfgs': {'log_type': 'wandb', 'log_project': 'align-anything', 'log_run_name': 'dpo', 'output_dir': '../outputs/dpo_tiv2t_1.5k_base', 'cache_dir': None, 'save_interval': 100000}, 'model_cfgs': {'model_name_or_path': '/aifs4su/yaodong/models/Qwen2-VL-7B-Instruct', 'trust_remote_code': True, 'model_max_length': 4096}, 'special_tokens': None}
15
+ 2024-09-21 11:12:22,882 INFO MainThread:2809147 [wandb_init.py:init():619] starting backend
16
+ 2024-09-21 11:12:22,882 INFO MainThread:2809147 [wandb_init.py:init():623] setting up manager
17
+ 2024-09-21 11:12:22,883 INFO MainThread:2809147 [backend.py:_multiprocessing_setup():105] multiprocessing start_methods=fork,spawn,forkserver, using: spawn
18
+ 2024-09-21 11:12:22,884 INFO MainThread:2809147 [wandb_init.py:init():631] backend started and connected
19
+ 2024-09-21 11:12:22,886 INFO MainThread:2809147 [wandb_init.py:init():720] updated telemetry
20
+ 2024-09-21 11:12:22,897 INFO MainThread:2809147 [wandb_init.py:init():753] communicating run to backend with 90.0 second timeout
21
+ 2024-09-21 11:12:23,613 INFO MainThread:2809147 [wandb_run.py:_on_init():2435] communicating current version
22
+ 2024-09-21 11:12:23,800 INFO MainThread:2809147 [wandb_run.py:_on_init():2444] got version response upgrade_message: "wandb version 0.18.1 is available! To upgrade, please run:\n $ pip install wandb --upgrade"
23
+
24
+ 2024-09-21 11:12:23,801 INFO MainThread:2809147 [wandb_init.py:init():804] starting run threads in backend
25
+ 2024-09-21 11:12:27,363 INFO MainThread:2809147 [wandb_run.py:_console_start():2413] atexit reg
26
+ 2024-09-21 11:12:27,363 INFO MainThread:2809147 [wandb_run.py:_redirect():2255] redirect: wrap_raw
27
+ 2024-09-21 11:12:27,363 INFO MainThread:2809147 [wandb_run.py:_redirect():2320] Wrapping output streams.
28
+ 2024-09-21 11:12:27,363 INFO MainThread:2809147 [wandb_run.py:_redirect():2345] Redirects installed.
29
+ 2024-09-21 11:12:27,366 INFO MainThread:2809147 [wandb_init.py:init():847] run started, returning control to user process
30
+ 2024-09-21 12:26:31,218 INFO MainThread:2809147 [wandb_run.py:_finish():2107] finishing run htlou/align-anything/4ony16ec
31
+ 2024-09-21 12:26:31,219 INFO MainThread:2809147 [wandb_run.py:_atexit_cleanup():2374] got exitcode: 0
32
+ 2024-09-21 12:26:31,220 INFO MainThread:2809147 [wandb_run.py:_restore():2352] restore
33
+ 2024-09-21 12:26:31,220 INFO MainThread:2809147 [wandb_run.py:_restore():2358] restore done
34
+ 2024-09-21 12:26:37,117 INFO MainThread:2809147 [wandb_run.py:_footer_history_summary_info():4016] rendering history
35
+ 2024-09-21 12:26:37,118 INFO MainThread:2809147 [wandb_run.py:_footer_history_summary_info():4048] rendering summary
36
+ 2024-09-21 12:26:37,124 INFO MainThread:2809147 [wandb_run.py:_footer_sync_info():3975] logging synced files
wandb/run-20240921_111222-4ony16ec/run-4ony16ec.wandb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7085eba7772eb3cb6852a78cee03b387b08c5574027a7013d650e477e9adcbad
3
+ size 1984316
wandb/run-20240921_115259-p9bvnzls/files/conda-environment.yaml ADDED
@@ -0,0 +1,516 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ name: hantao_tiv
2
+ channels:
3
+ - nvidia/label/cuda-12.1.0
4
+ - nvidia
5
+ - pytorch
6
+ - huggingface
7
+ - conda-forge
8
+ - defaults
9
+ dependencies:
10
+ - _libgcc_mutex=0.1=conda_forge
11
+ - _openmp_mutex=4.5=2_gnu
12
+ - aom=3.9.1=hac33072_0
13
+ - asttokens=2.4.1=pyhd8ed1ab_0
14
+ - blas=1.0=mkl
15
+ - brotli-python=1.1.0=py311hb755f60_1
16
+ - bzip2=1.0.8=h4bc722e_7
17
+ - ca-certificates=2024.7.4=hbcca054_0
18
+ - cairo=1.18.0=hebfffa5_3
19
+ - certifi=2024.7.4=pyhd8ed1ab_0
20
+ - cffi=1.16.0=py311hb3a22ac_0
21
+ - charset-normalizer=3.3.2=pyhd8ed1ab_0
22
+ - comm=0.2.2=pyhd8ed1ab_0
23
+ - cuda=12.1.0=0
24
+ - cuda-cccl=12.1.55=0
25
+ - cuda-command-line-tools=12.1.0=0
26
+ - cuda-compiler=12.1.0=0
27
+ - cuda-cudart=12.1.55=0
28
+ - cuda-cudart-dev=12.1.55=0
29
+ - cuda-cudart-static=12.1.55=0
30
+ - cuda-cuobjdump=12.1.55=0
31
+ - cuda-cupti=12.1.62=0
32
+ - cuda-cupti-static=12.1.62=0
33
+ - cuda-cuxxfilt=12.1.55=0
34
+ - cuda-demo-suite=12.1.55=0
35
+ - cuda-documentation=12.1.55=0
36
+ - cuda-driver-dev=12.1.55=0
37
+ - cuda-gdb=12.1.55=0
38
+ - cuda-libraries=12.1.0=0
39
+ - cuda-libraries-dev=12.1.0=0
40
+ - cuda-libraries-static=12.1.0=0
41
+ - cuda-nsight=12.1.55=0
42
+ - cuda-nsight-compute=12.1.0=0
43
+ - cuda-nvcc=12.1.66=0
44
+ - cuda-nvdisasm=12.1.55=0
45
+ - cuda-nvml-dev=12.1.55=0
46
+ - cuda-nvprof=12.1.55=0
47
+ - cuda-nvprune=12.1.55=0
48
+ - cuda-nvrtc=12.1.55=0
49
+ - cuda-nvrtc-dev=12.1.55=0
50
+ - cuda-nvrtc-static=12.1.55=0
51
+ - cuda-nvtx=12.1.66=0
52
+ - cuda-nvvp=12.1.55=0
53
+ - cuda-opencl=12.1.56=0
54
+ - cuda-opencl-dev=12.1.56=0
55
+ - cuda-profiler-api=12.1.55=0
56
+ - cuda-runtime=12.1.0=0
57
+ - cuda-sanitizer-api=12.1.55=0
58
+ - cuda-toolkit=12.1.0=0
59
+ - cuda-tools=12.1.0=0
60
+ - cuda-visual-tools=12.1.0=0
61
+ - dav1d=1.2.1=hd590300_0
62
+ - debugpy=1.8.2=py311h4332511_0
63
+ - exceptiongroup=1.2.2=pyhd8ed1ab_0
64
+ - executing=2.0.1=pyhd8ed1ab_0
65
+ - expat=2.6.2=h59595ed_0
66
+ - ffmpeg=7.0.1=gpl_h9be9148_104
67
+ - filelock=3.15.4=pyhd8ed1ab_0
68
+ - font-ttf-dejavu-sans-mono=2.37=hab24e00_0
69
+ - font-ttf-inconsolata=3.000=h77eed37_0
70
+ - font-ttf-source-code-pro=2.038=h77eed37_0
71
+ - font-ttf-ubuntu=0.83=h77eed37_2
72
+ - fontconfig=2.14.2=h14ed4e7_0
73
+ - fonts-conda-ecosystem=1=0
74
+ - fonts-conda-forge=1=0
75
+ - freetype=2.12.1=h267a509_2
76
+ - fribidi=1.0.10=h36c2ea0_0
77
+ - gds-tools=1.6.0.25=0
78
+ - gettext=0.22.5=h59595ed_2
79
+ - gettext-tools=0.22.5=h59595ed_2
80
+ - git-lfs=3.5.1=ha770c72_0
81
+ - gmp=6.3.0=hac33072_2
82
+ - gmpy2=2.1.5=py311hc4f1f91_1
83
+ - gnutls=3.7.9=hb077bed_0
84
+ - graphite2=1.3.13=h59595ed_1003
85
+ - h2=4.1.0=pyhd8ed1ab_0
86
+ - harfbuzz=9.0.0=hda332d3_1
87
+ - hpack=4.0.0=pyh9f0ad1d_0
88
+ - hyperframe=6.0.1=pyhd8ed1ab_0
89
+ - icu=75.1=he02047a_0
90
+ - idna=3.7=pyhd8ed1ab_0
91
+ - importlib-metadata=8.2.0=pyha770c72_0
92
+ - importlib_metadata=8.2.0=hd8ed1ab_0
93
+ - intel-openmp=2022.0.1=h06a4308_3633
94
+ - ipykernel=6.29.5=pyh3099207_0
95
+ - ipython=8.26.0=pyh707e725_0
96
+ - jedi=0.19.1=pyhd8ed1ab_0
97
+ - jinja2=3.1.4=pyhd8ed1ab_0
98
+ - jupyter_client=8.6.2=pyhd8ed1ab_0
99
+ - jupyter_core=5.7.2=py311h38be061_0
100
+ - keyutils=1.6.1=h166bdaf_0
101
+ - krb5=1.21.3=h659f571_0
102
+ - lame=3.100=h166bdaf_1003
103
+ - lcms2=2.16=hb7c19ff_0
104
+ - ld_impl_linux-64=2.40=hf3520f5_7
105
+ - lerc=4.0.0=h27087fc_0
106
+ - libabseil=20240116.2=cxx17_he02047a_1
107
+ - libasprintf=0.22.5=h661eb56_2
108
+ - libasprintf-devel=0.22.5=h661eb56_2
109
+ - libass=0.17.1=h39113c1_2
110
+ - libblas=3.9.0=16_linux64_mkl
111
+ - libcblas=3.9.0=16_linux64_mkl
112
+ - libcublas=12.1.0.26=0
113
+ - libcublas-dev=12.1.0.26=0
114
+ - libcublas-static=12.1.0.26=0
115
+ - libcufft=11.0.2.4=0
116
+ - libcufft-dev=11.0.2.4=0
117
+ - libcufft-static=11.0.2.4=0
118
+ - libcufile=1.6.0.25=0
119
+ - libcufile-dev=1.6.0.25=0
120
+ - libcufile-static=1.6.0.25=0
121
+ - libcurand=10.3.2.56=0
122
+ - libcurand-dev=10.3.2.56=0
123
+ - libcurand-static=10.3.2.56=0
124
+ - libcusolver=11.4.4.55=0
125
+ - libcusolver-dev=11.4.4.55=0
126
+ - libcusolver-static=11.4.4.55=0
127
+ - libcusparse=12.0.2.55=0
128
+ - libcusparse-dev=12.0.2.55=0
129
+ - libcusparse-static=12.0.2.55=0
130
+ - libdeflate=1.20=hd590300_0
131
+ - libdrm=2.4.122=h4ab18f5_0
132
+ - libedit=3.1.20191231=he28a2e2_2
133
+ - libexpat=2.6.2=h59595ed_0
134
+ - libffi=3.4.2=h7f98852_5
135
+ - libgcc-ng=14.1.0=h77fa898_0
136
+ - libgettextpo=0.22.5=h59595ed_2
137
+ - libgettextpo-devel=0.22.5=h59595ed_2
138
+ - libglib=2.80.3=h8a4344b_1
139
+ - libgomp=14.1.0=h77fa898_0
140
+ - libhwloc=2.11.1=default_hecaa2ac_1000
141
+ - libiconv=1.17=hd590300_2
142
+ - libidn2=2.3.7=hd590300_0
143
+ - libjpeg-turbo=3.0.0=hd590300_1
144
+ - liblapack=3.9.0=16_linux64_mkl
145
+ - libnpp=12.0.2.50=0
146
+ - libnpp-dev=12.0.2.50=0
147
+ - libnpp-static=12.0.2.50=0
148
+ - libnsl=2.0.1=hd590300_0
149
+ - libnvjitlink=12.1.105=0
150
+ - libnvjitlink-dev=12.1.55=0
151
+ - libnvjpeg=12.1.0.39=0
152
+ - libnvjpeg-dev=12.1.0.39=0
153
+ - libnvjpeg-static=12.1.0.39=0
154
+ - libnvvm-samples=12.1.55=0
155
+ - libopenvino=2024.2.0=h2da1b83_1
156
+ - libopenvino-auto-batch-plugin=2024.2.0=hb045406_1
157
+ - libopenvino-auto-plugin=2024.2.0=hb045406_1
158
+ - libopenvino-hetero-plugin=2024.2.0=h5c03a75_1
159
+ - libopenvino-intel-cpu-plugin=2024.2.0=h2da1b83_1
160
+ - libopenvino-intel-gpu-plugin=2024.2.0=h2da1b83_1
161
+ - libopenvino-intel-npu-plugin=2024.2.0=he02047a_1
162
+ - libopenvino-ir-frontend=2024.2.0=h5c03a75_1
163
+ - libopenvino-onnx-frontend=2024.2.0=h07e8aee_1
164
+ - libopenvino-paddle-frontend=2024.2.0=h07e8aee_1
165
+ - libopenvino-pytorch-frontend=2024.2.0=he02047a_1
166
+ - libopenvino-tensorflow-frontend=2024.2.0=h39126c6_1
167
+ - libopenvino-tensorflow-lite-frontend=2024.2.0=he02047a_1
168
+ - libopus=1.3.1=h7f98852_1
169
+ - libpciaccess=0.18=hd590300_0
170
+ - libpng=1.6.43=h2797004_0
171
+ - libprotobuf=4.25.3=h08a7969_0
172
+ - libsodium=1.0.18=h36c2ea0_1
173
+ - libsqlite=3.46.0=hde9e2c9_0
174
+ - libstdcxx-ng=14.1.0=hc0a3c3a_0
175
+ - libtasn1=4.19.0=h166bdaf_0
176
+ - libtiff=4.6.0=h1dd3fc0_3
177
+ - libunistring=0.9.10=h7f98852_0
178
+ - libuuid=2.38.1=h0b41bf4_0
179
+ - libva=2.22.0=hb711507_0
180
+ - libvpx=1.14.1=hac33072_0
181
+ - libwebp-base=1.4.0=hd590300_0
182
+ - libxcb=1.16=hd590300_0
183
+ - libxcrypt=4.4.36=hd590300_1
184
+ - libxml2=2.12.7=he7c6b58_4
185
+ - libzlib=1.3.1=h4ab18f5_1
186
+ - llvm-openmp=15.0.7=h0cdce71_0
187
+ - markupsafe=2.1.5=py311h459d7ec_0
188
+ - matplotlib-inline=0.1.7=pyhd8ed1ab_0
189
+ - mkl=2022.1.0=hc2b9512_224
190
+ - mpc=1.3.1=hfe3b2da_0
191
+ - mpfr=4.2.1=h38ae2d0_2
192
+ - mpmath=1.3.0=pyhd8ed1ab_0
193
+ - ncurses=6.5=h59595ed_0
194
+ - nest-asyncio=1.6.0=pyhd8ed1ab_0
195
+ - nettle=3.9.1=h7ab15ed_0
196
+ - networkx=3.3=pyhd8ed1ab_1
197
+ - nsight-compute=2023.1.0.15=0
198
+ - ocl-icd=2.3.2=hd590300_1
199
+ - openh264=2.4.1=h59595ed_0
200
+ - openjpeg=2.5.2=h488ebb8_0
201
+ - openssl=3.3.1=h4bc722e_2
202
+ - p11-kit=0.24.1=hc5aa10d_0
203
+ - packaging=24.1=pyhd8ed1ab_0
204
+ - parso=0.8.4=pyhd8ed1ab_0
205
+ - pcre2=10.44=h0f59acf_0
206
+ - pexpect=4.9.0=pyhd8ed1ab_0
207
+ - pickleshare=0.7.5=py_1003
208
+ - pillow=10.4.0=py311h82a398c_0
209
+ - pip=24.0=pyhd8ed1ab_0
210
+ - pixman=0.43.2=h59595ed_0
211
+ - prompt-toolkit=3.0.47=pyha770c72_0
212
+ - psutil=6.0.0=py311h331c9d8_0
213
+ - pthread-stubs=0.4=h36c2ea0_1001
214
+ - ptyprocess=0.7.0=pyhd3deb0d_0
215
+ - pugixml=1.14=h59595ed_0
216
+ - pure_eval=0.2.3=pyhd8ed1ab_0
217
+ - pycparser=2.22=pyhd8ed1ab_0
218
+ - pygments=2.18.0=pyhd8ed1ab_0
219
+ - pysocks=1.7.1=pyha2e5f31_6
220
+ - python=3.11.9=hb806964_0_cpython
221
+ - python_abi=3.11=4_cp311
222
+ - pytorch=2.4.0=py3.11_cuda12.1_cudnn9.1.0_0
223
+ - pytorch-cuda=12.1=ha16c6d3_5
224
+ - pytorch-mutex=1.0=cuda
225
+ - pyyaml=6.0.1=py311h459d7ec_1
226
+ - pyzmq=26.0.3=py311h08a0b41_0
227
+ - readline=8.2=h8228510_1
228
+ - requests=2.32.3=pyhd8ed1ab_0
229
+ - setuptools=71.0.4=pyhd8ed1ab_0
230
+ - six=1.16.0=pyh6c4a22f_0
231
+ - snappy=1.2.1=ha2e4443_0
232
+ - stack_data=0.6.2=pyhd8ed1ab_0
233
+ - svt-av1=2.1.2=hac33072_0
234
+ - sympy=1.13.0=pypyh2585a3b_103
235
+ - tbb=2021.12.0=h434a139_3
236
+ - tk=8.6.13=noxft_h4845f30_101
237
+ - torchaudio=2.4.0=py311_cu121
238
+ - torchtriton=3.0.0=py311
239
+ - tornado=6.4.1=py311h331c9d8_0
240
+ - traitlets=5.14.3=pyhd8ed1ab_0
241
+ - typing_extensions=4.12.2=pyha770c72_0
242
+ - urllib3=2.2.2=pyhd8ed1ab_1
243
+ - wayland=1.23.0=h5291e77_0
244
+ - wayland-protocols=1.36=hd8ed1ab_0
245
+ - wcwidth=0.2.13=pyhd8ed1ab_0
246
+ - wheel=0.43.0=pyhd8ed1ab_1
247
+ - x264=1!164.3095=h166bdaf_2
248
+ - x265=3.5=h924138e_3
249
+ - xorg-fixesproto=5.0=h7f98852_1002
250
+ - xorg-kbproto=1.0.7=h7f98852_1002
251
+ - xorg-libice=1.1.1=hd590300_0
252
+ - xorg-libsm=1.2.4=h7391055_0
253
+ - xorg-libx11=1.8.9=hb711507_1
254
+ - xorg-libxau=1.0.11=hd590300_0
255
+ - xorg-libxdmcp=1.1.3=h7f98852_0
256
+ - xorg-libxext=1.3.4=h0b41bf4_2
257
+ - xorg-libxfixes=5.0.3=h7f98852_1004
258
+ - xorg-libxrender=0.9.11=hd590300_0
259
+ - xorg-renderproto=0.11.1=h7f98852_1002
260
+ - xorg-xextproto=7.3.0=h0b41bf4_1003
261
+ - xorg-xproto=7.0.31=h7f98852_1007
262
+ - xz=5.2.6=h166bdaf_0
263
+ - yaml=0.2.5=h7f98852_2
264
+ - zeromq=4.3.5=h75354e8_4
265
+ - zipp=3.19.2=pyhd8ed1ab_0
266
+ - zlib=1.3.1=h4ab18f5_1
267
+ - zstandard=0.23.0=py311h5cd10c7_0
268
+ - zstd=1.5.6=ha6fb4c9_0
269
+ - pip:
270
+ - about-time==4.2.1
271
+ - absl-py==2.1.0
272
+ - accelerate==0.34.0
273
+ - aiofiles==23.2.1
274
+ - aiohttp==3.9.5
275
+ - aiohttp-retry==2.8.3
276
+ - aiosignal==1.3.1
277
+ - align-anything==0.0.1.dev0
278
+ - alive-progress==3.1.5
279
+ - amqp==5.2.0
280
+ - annotated-types==0.7.0
281
+ - antlr4-python3-runtime==4.9.3
282
+ - anyio==4.4.0
283
+ - appdirs==1.4.4
284
+ - asyncssh==2.16.0
285
+ - atpublic==5.0
286
+ - attrs==23.2.0
287
+ - audioread==3.0.1
288
+ - backoff==2.2.1
289
+ - billiard==4.2.0
290
+ - boto3==1.35.9
291
+ - botocore==1.35.9
292
+ - cachetools==5.4.0
293
+ - celery==5.4.0
294
+ - cfgv==3.4.0
295
+ - click==8.1.7
296
+ - click-didyoumean==0.3.1
297
+ - click-plugins==1.1.1
298
+ - click-repl==0.3.0
299
+ - cloudpickle==3.0.0
300
+ - cmake==3.30.1
301
+ - colorama==0.4.6
302
+ - commonmark==0.9.1
303
+ - configobj==5.0.8
304
+ - contourpy==1.2.1
305
+ - cryptography==43.0.0
306
+ - cycler==0.12.1
307
+ - dacite==1.6.0
308
+ - dagshub==0.3.35
309
+ - dagshub-annotation-converter==0.1.0
310
+ - dataclasses-json==0.6.7
311
+ - datasets==2.20.0
312
+ - decorator==4.4.2
313
+ - deepspeed==0.14.4
314
+ - dictdiffer==0.9.0
315
+ - diffusers==0.29.2
316
+ - dill==0.3.8
317
+ - diskcache==5.6.3
318
+ - distlib==0.3.8
319
+ - distro==1.9.0
320
+ - dnspython==2.6.1
321
+ - docker-pycreds==0.4.0
322
+ - docstring-parser==0.16
323
+ - dpath==2.2.0
324
+ - dulwich==0.22.1
325
+ - dvc==3.55.1
326
+ - dvc-data==3.16.5
327
+ - dvc-http==2.32.0
328
+ - dvc-objects==5.1.0
329
+ - dvc-render==1.0.2
330
+ - dvc-studio-client==0.21.0
331
+ - dvc-task==0.4.0
332
+ - einops==0.8.0
333
+ - email-validator==2.2.0
334
+ - entrypoints==0.4
335
+ - fastapi==0.111.1
336
+ - fastapi-cli==0.0.4
337
+ - ffmpy==0.3.3
338
+ - fire==0.6.0
339
+ - flatten-dict==0.4.2
340
+ - flufl-lock==8.1.0
341
+ - fonttools==4.53.1
342
+ - frozenlist==1.4.1
343
+ - fsspec==2024.5.0
344
+ - funcy==2.0
345
+ - fusepy==3.0.1
346
+ - gitdb==4.0.11
347
+ - gitpython==3.1.43
348
+ - gql==3.5.0
349
+ - gradio==4.39.0
350
+ - gradio-client==1.1.1
351
+ - gradio-multimodalchatbot==0.0.1
352
+ - grandalf==0.8
353
+ - grapheme==0.6.0
354
+ - graphql-core==3.2.3
355
+ - grpcio==1.65.1
356
+ - gto==1.7.1
357
+ - h11==0.14.0
358
+ - hjson==3.1.0
359
+ - httpcore==1.0.5
360
+ - httptools==0.6.1
361
+ - httpx==0.27.2
362
+ - huggingface-hub==0.24.3
363
+ - hydra-core==1.3.2
364
+ - identify==2.6.0
365
+ - imageio==2.35.1
366
+ - imageio-ffmpeg==0.5.1
367
+ - importlib-resources==6.4.0
368
+ - iniconfig==2.0.0
369
+ - interegular==0.3.3
370
+ - iterative-telemetry==0.0.8
371
+ - jmespath==1.0.1
372
+ - joblib==1.4.2
373
+ - jsonschema==4.23.0
374
+ - jsonschema-specifications==2023.12.1
375
+ - kiwisolver==1.4.5
376
+ - kombu==5.4.0
377
+ - lark==1.1.9
378
+ - lazy-loader==0.4
379
+ - librosa==0.10.2.post1
380
+ - llamafactory==0.8.4.dev0
381
+ - llvmlite==0.43.0
382
+ - lm-format-enforcer==0.10.3
383
+ - lxml==5.3.0
384
+ - markdown==3.6
385
+ - markdown-it-py==3.0.0
386
+ - marshmallow==3.22.0
387
+ - matplotlib==3.9.1
388
+ - mdurl==0.1.2
389
+ - mmsg==0.1.dev14+gbd2b056.d20240803
390
+ - moviepy==1.0.3
391
+ - mpi4py==4.0.0
392
+ - msgpack==1.0.8
393
+ - multidict==6.0.5
394
+ - multiprocess==0.70.16
395
+ - mypy-extensions==1.0.0
396
+ - ninja==1.11.1.1
397
+ - nodeenv==1.9.1
398
+ - numba==0.60.0
399
+ - numpy==1.26.4
400
+ - nvidia-cublas-cu12==12.1.3.1
401
+ - nvidia-cuda-cupti-cu12==12.1.105
402
+ - nvidia-cuda-nvrtc-cu12==12.1.105
403
+ - nvidia-cuda-runtime-cu12==12.1.105
404
+ - nvidia-cudnn-cu12==8.9.2.26
405
+ - nvidia-cufft-cu12==11.0.2.54
406
+ - nvidia-curand-cu12==10.3.2.106
407
+ - nvidia-cusolver-cu12==11.4.5.107
408
+ - nvidia-cusparse-cu12==12.1.0.106
409
+ - nvidia-ml-py==12.535.161
410
+ - nvidia-nccl-cu12==2.20.5
411
+ - nvidia-nvjitlink-cu12==12.5.82
412
+ - nvidia-nvtx-cu12==12.1.105
413
+ - nvitop==1.3.2
414
+ - omegaconf==2.3.0
415
+ - openai==1.37.1
416
+ - optree==0.12.1
417
+ - orjson==3.10.6
418
+ - outlines==0.0.47.dev37+g26e2934
419
+ - pandas==2.2.2
420
+ - pathspec==0.12.1
421
+ - pathvalidate==3.0.0
422
+ - peft==0.12.0
423
+ - platformdirs==3.11.0
424
+ - pluggy==1.5.0
425
+ - pooch==1.8.2
426
+ - pre-commit==3.8.0
427
+ - proglog==0.1.10
428
+ - prometheus-client==0.20.0
429
+ - prometheus-fastapi-instrumentator==7.0.0
430
+ - protobuf==4.25.4
431
+ - py-cpuinfo==9.0.0
432
+ - pyairports==2.1.1
433
+ - pyarrow==17.0.0
434
+ - pyarrow-hotfix==0.6
435
+ - pyav==13.0.0
436
+ - pycountry==24.6.1
437
+ - pydantic==2.8.2
438
+ - pydantic-core==2.20.1
439
+ - pydot==3.0.1
440
+ - pydub==0.25.1
441
+ - pygit2==1.15.1
442
+ - pygtrie==2.5.0
443
+ - pyparsing==3.1.2
444
+ - pytest==8.3.2
445
+ - python-dateutil==2.9.0.post0
446
+ - python-dotenv==1.0.1
447
+ - python-multipart==0.0.9
448
+ - pytz==2024.1
449
+ - ranger-fm==1.9.3
450
+ - ray==2.34.0
451
+ - referencing==0.35.1
452
+ - regex==2024.7.24
453
+ - requests-toolbelt==1.0.0
454
+ - rfc3986==1.5.0
455
+ - rich==13.1.0
456
+ - rpds-py==0.19.1
457
+ - ruamel-yaml==0.18.6
458
+ - ruamel-yaml-clib==0.2.8
459
+ - ruff==0.5.5
460
+ - s3transfer==0.10.2
461
+ - safetensors==0.4.3
462
+ - scikit-learn==1.5.1
463
+ - scipy==1.14.0
464
+ - scmrepo==3.3.7
465
+ - semantic-version==2.10.0
466
+ - semver==3.0.2
467
+ - sentencepiece==0.2.0
468
+ - sentry-sdk==2.11.0
469
+ - setproctitle==1.3.3
470
+ - shellingham==1.5.4
471
+ - shortuuid==1.0.13
472
+ - shtab==1.7.1
473
+ - smmap==5.0.1
474
+ - sniffio==1.3.1
475
+ - soundfile==0.12.1
476
+ - soxr==0.4.0
477
+ - sqltrie==0.11.1
478
+ - sse-starlette==2.1.3
479
+ - starlette==0.37.2
480
+ - tabulate==0.9.0
481
+ - tenacity==8.2.3
482
+ - tensorboard==2.17.0
483
+ - tensorboard-data-server==0.7.2
484
+ - term-image==0.7.2
485
+ - termcolor==2.4.0
486
+ - threadpoolctl==3.5.0
487
+ - tiktoken==0.7.0
488
+ - tokenizers==0.19.1
489
+ - tomlkit==0.12.0
490
+ - torch==2.3.1
491
+ - torchvision==0.18.1
492
+ - tqdm==4.66.4
493
+ - transformers==4.45.0.dev0
494
+ - treelib==1.6.4
495
+ - triton==2.3.1
496
+ - trl==0.9.6
497
+ - typer==0.12.3
498
+ - typing-inspect==0.9.0
499
+ - tyro==0.8.10
500
+ - tzdata==2024.1
501
+ - uvicorn==0.30.3
502
+ - uvloop==0.19.0
503
+ - vine==5.1.0
504
+ - virtualenv==20.26.3
505
+ - vllm==0.5.3.post1
506
+ - vllm-flash-attn==2.5.9.post1
507
+ - voluptuous==0.15.2
508
+ - wandb==0.17.5
509
+ - watchfiles==0.22.0
510
+ - websockets==11.0.3
511
+ - werkzeug==3.0.3
512
+ - xformers==0.0.27
513
+ - xxhash==3.4.1
514
+ - yarl==1.9.4
515
+ - zc-lockfile==3.0.post1
516
+ prefix: /aifs4su/yaodong/miniconda3/envs/hantao_tiv
wandb/run-20240921_115259-p9bvnzls/files/config.yaml ADDED
@@ -0,0 +1,111 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ wandb_version: 1
2
+
3
+ train_cfgs:
4
+ desc: null
5
+ value:
6
+ ds_cfgs: ds_z3_config.json
7
+ epochs: 3
8
+ seed: 42
9
+ per_device_train_batch_size: 1.0
10
+ per_device_eval_batch_size: 1.0
11
+ gradient_accumulation_steps: 1.0
12
+ gradient_checkpointing: true
13
+ learning_rate: 1.0e-06
14
+ lr_scheduler_type: cosine
15
+ lr_warmup_ratio: 0.01
16
+ weight_decay: 0.0
17
+ adam_betas:
18
+ - 0.9
19
+ - 0.95
20
+ bf16: true
21
+ fp16: false
22
+ eval_strategy: epoch
23
+ eval_interval: 10
24
+ regularization: 0.001
25
+ scale_coeff: 0.1
26
+ freeze_mm_proj: false
27
+ freeze_vision_tower: true
28
+ freeze_language_model: false
29
+ data_cfgs:
30
+ desc: null
31
+ value:
32
+ train_datasets: /aifs4su/yaodong/datasets/aaa_dataset/TV2T-preference/extracted
33
+ train_template: NExTQA_preference
34
+ train_size: null
35
+ train_split: train
36
+ train_subset: null
37
+ train_data_files: extracted_preference_1.5k_washed.json
38
+ train_optional_args: []
39
+ eval_datasets: null
40
+ eval_template: null
41
+ eval_size: null
42
+ eval_split: null
43
+ eval_subset: null
44
+ eval_data_files: null
45
+ eval_optional_args: []
46
+ logger_cfgs:
47
+ desc: null
48
+ value:
49
+ log_type: wandb
50
+ log_project: align-anything
51
+ log_run_name: dpo
52
+ output_dir: ../outputs/dpo_tiv2t_1.5k_base
53
+ cache_dir: null
54
+ save_interval: 100000
55
+ model_cfgs:
56
+ desc: null
57
+ value:
58
+ model_name_or_path: /aifs4su/yaodong/models/Qwen2-VL-7B-Instruct
59
+ trust_remote_code: true
60
+ model_max_length: 4096
61
+ special_tokens:
62
+ desc: null
63
+ value: null
64
+ _wandb:
65
+ desc: null
66
+ value:
67
+ python_version: 3.11.9
68
+ cli_version: 0.17.5
69
+ framework: huggingface
70
+ huggingface_version: 4.45.0.dev0
71
+ is_jupyter_run: false
72
+ is_kaggle_kernel: false
73
+ start_time: 1726890779
74
+ t:
75
+ 1:
76
+ - 1
77
+ - 5
78
+ - 11
79
+ - 41
80
+ - 49
81
+ - 51
82
+ - 53
83
+ - 55
84
+ - 71
85
+ - 83
86
+ - 98
87
+ - 105
88
+ 2:
89
+ - 1
90
+ - 5
91
+ - 11
92
+ - 41
93
+ - 49
94
+ - 51
95
+ - 53
96
+ - 55
97
+ - 71
98
+ - 83
99
+ - 98
100
+ - 105
101
+ 3:
102
+ - 13
103
+ - 16
104
+ - 23
105
+ - 61
106
+ 4: 3.11.9
107
+ 5: 0.17.5
108
+ 6: 4.45.0.dev0
109
+ 8:
110
+ - 5
111
+ 13: linux-x86_64
wandb/run-20240921_115259-p9bvnzls/files/output.log ADDED
@@ -0,0 +1,190 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ ***** Running training *****
3
+
4
+ Training 1/3 epoch: 0%| | 0/531 [00:00<?, ?it/s]`use_cache=True` is incompatible with gradient checkpointing. Setting `use_cache=False`...
5
+ /aifs4su/yaodong/miniconda3/envs/hantao_tiv/lib/python3.11/site-packages/torch/utils/checkpoint.py:295: FutureWarning: `torch.cpu.amp.autocast(args...)` is deprecated. Please use `torch.amp.autocast('cpu', args...)` instead.
6
+ with torch.enable_grad(), device_autocast_ctx, torch.cpu.amp.autocast(**ctx.cpu_autocast_kwargs): # type: ignore[attr-defined]
7
+
8
+
9
+
10
+
11
+
12
+
13
+
14
+
15
+
16
+
17
+ Training 1/3 epoch (loss 1.9530): 2%|██▍ | 9/531 [01:54<1:39:32, 11.44s/it]
18
+
19
+
20
+
21
+
22
+
23
+
24
+
25
+
26
+
27
+
28
+ Training 1/3 epoch (loss 0.8921): 4%|█████ | 19/531 [03:48<1:32:14, 10.81s/it]
29
+
30
+
31
+
32
+
33
+
34
+
35
+
36
+
37
+
38
+
39
+ Training 1/3 epoch (loss 0.8901): 5%|███████▋ | 29/531 [05:46<1:37:31, 11.66s/it]
40
+
41
+
42
+
43
+
44
+
45
+
46
+
47
+
48
+
49
+
50
+ Training 1/3 epoch (loss 0.9671): 7%|██████████▎ | 39/531 [07:46<1:37:35, 11.90s/it]
51
+
52
+
53
+
54
+
55
+
56
+
57
+
58
+
59
+
60
+
61
+ Training 1/3 epoch (loss 1.4778): 9%|█████████████ | 49/531 [09:32<1:23:36, 10.41s/it]
62
+
63
+
64
+
65
+
66
+
67
+
68
+
69
+
70
+
71
+
72
+ Training 1/3 epoch (loss 0.3492): 11%|███████████████▋ | 59/531 [11:20<1:14:53, 9.52s/it]
73
+
74
+
75
+
76
+
77
+
78
+
79
+
80
+
81
+
82
+
83
+ Training 1/3 epoch (loss 0.6911): 13%|██████████████████▎ | 69/531 [12:54<1:14:58, 9.74s/it]
84
+
85
+
86
+
87
+
88
+
89
+
90
+
91
+
92
+
93
+
94
+ Training 1/3 epoch (loss 0.7152): 15%|████████████████████▉ | 79/531 [14:59<1:19:35, 10.57s/it]
95
+
96
+
97
+
98
+
99
+
100
+
101
+
102
+
103
+
104
+
105
+ Training 1/3 epoch (loss 0.5334): 17%|███████████████████████▋ | 89/531 [16:40<1:15:43, 10.28s/it]
106
+
107
+
108
+
109
+
110
+
111
+
112
+
113
+
114
+
115
+
116
+ Training 1/3 epoch (loss 0.4098): 19%|██████████████████████████▎ | 99/531 [18:32<1:10:19, 9.77s/it]
117
+
118
+
119
+
120
+
121
+
122
+
123
+
124
+
125
+
126
+
127
+ Training 1/3 epoch (loss 0.4588): 21%|████████████████████████████▋ | 109/531 [20:15<1:15:50, 10.78s/it]
128
+
129
+
130
+
131
+
132
+
133
+
134
+
135
+
136
+
137
+
138
+ Training 1/3 epoch (loss 1.6005): 22%|███████████████████████████████▎ | 119/531 [21:59<1:05:54, 9.60s/it]
139
+
140
+
141
+
142
+
143
+
144
+
145
+
146
+
147
+
148
+
149
+ Training 1/3 epoch (loss 0.2724): 24%|██████████████████████████████████ | 129/531 [23:35<1:06:56, 9.99s/it]
150
+
151
+
152
+
153
+
154
+
155
+
156
+
157
+
158
+
159
+
160
+ Training 1/3 epoch (loss 1.3423): 26%|████████████████████████████████████▋ | 139/531 [25:06<1:00:28, 9.26s/it]
161
+
162
+
163
+
164
+
165
+
166
+
167
+
168
+
169
+
170
+
171
+ Training 1/3 epoch (loss 0.4799): 28%|███████████████████████████████████████▎ | 149/531 [26:57<1:20:06, 12.58s/it]
172
+
173
+
174
+
175
+
176
+
177
+
178
+
179
+
180
+
181
+
182
+ Training 1/3 epoch (loss 0.2165): 30%|█████████████████████████████████████████▉ | 159/531 [29:00<1:02:28, 10.08s/it]
183
+
184
+
185
+
186
+
187
+
188
+
189
+
190
+
wandb/run-20240921_115259-p9bvnzls/files/requirements.txt ADDED
@@ -0,0 +1,325 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Brotli==1.1.0
2
+ GitPython==3.1.43
3
+ Jinja2==3.1.4
4
+ Markdown==3.6
5
+ MarkupSafe==2.1.5
6
+ PySocks==1.7.1
7
+ PyYAML==6.0.1
8
+ Pygments==2.18.0
9
+ Werkzeug==3.0.3
10
+ about-time==4.2.1
11
+ absl-py==2.1.0
12
+ accelerate==0.34.0
13
+ aiofiles==23.2.1
14
+ aiohttp-retry==2.8.3
15
+ aiohttp==3.9.5
16
+ aiosignal==1.3.1
17
+ align-anything==0.0.1.dev0
18
+ align-anything==0.0.1.dev0
19
+ alive-progress==3.1.5
20
+ amqp==5.2.0
21
+ annotated-types==0.7.0
22
+ antlr4-python3-runtime==4.9.3
23
+ anyio==4.4.0
24
+ appdirs==1.4.4
25
+ asttokens==2.4.1
26
+ asyncssh==2.16.0
27
+ atpublic==5.0
28
+ attrs==23.2.0
29
+ audioread==3.0.1
30
+ autocommand==2.2.2
31
+ backoff==2.2.1
32
+ backports.tarfile==1.2.0
33
+ billiard==4.2.0
34
+ boto3==1.35.9
35
+ botocore==1.35.9
36
+ cachetools==5.4.0
37
+ celery==5.4.0
38
+ certifi==2024.7.4
39
+ cffi==1.16.0
40
+ cfgv==3.4.0
41
+ charset-normalizer==3.3.2
42
+ click-didyoumean==0.3.1
43
+ click-plugins==1.1.1
44
+ click-repl==0.3.0
45
+ click==8.1.7
46
+ cloudpickle==3.0.0
47
+ cmake==3.30.1
48
+ colorama==0.4.6
49
+ comm==0.2.2
50
+ commonmark==0.9.1
51
+ configobj==5.0.8
52
+ contourpy==1.2.1
53
+ cryptography==43.0.0
54
+ cycler==0.12.1
55
+ dacite==1.6.0
56
+ dagshub-annotation-converter==0.1.0
57
+ dagshub==0.3.35
58
+ dataclasses-json==0.6.7
59
+ datasets==2.20.0
60
+ debugpy==1.8.2
61
+ decorator==4.4.2
62
+ deepspeed==0.14.4
63
+ dictdiffer==0.9.0
64
+ diffusers==0.29.2
65
+ dill==0.3.8
66
+ diskcache==5.6.3
67
+ distlib==0.3.8
68
+ distro==1.9.0
69
+ dnspython==2.6.1
70
+ docker-pycreds==0.4.0
71
+ docstring_parser==0.16
72
+ dpath==2.2.0
73
+ dulwich==0.22.1
74
+ dvc-data==3.16.5
75
+ dvc-http==2.32.0
76
+ dvc-objects==5.1.0
77
+ dvc-render==1.0.2
78
+ dvc-studio-client==0.21.0
79
+ dvc-task==0.4.0
80
+ dvc==3.55.1
81
+ einops==0.8.0
82
+ email_validator==2.2.0
83
+ entrypoints==0.4
84
+ exceptiongroup==1.2.2
85
+ executing==2.0.1
86
+ fastapi-cli==0.0.4
87
+ fastapi==0.111.1
88
+ ffmpy==0.3.3
89
+ filelock==3.15.4
90
+ fire==0.6.0
91
+ flatten-dict==0.4.2
92
+ flufl.lock==8.1.0
93
+ fonttools==4.53.1
94
+ frozenlist==1.4.1
95
+ fsspec==2024.5.0
96
+ funcy==2.0
97
+ fusepy==3.0.1
98
+ gitdb==4.0.11
99
+ gmpy2==2.1.5
100
+ gql==3.5.0
101
+ gradio==4.39.0
102
+ gradio_client==1.1.1
103
+ gradio_multimodalchatbot==0.0.1
104
+ grandalf==0.8
105
+ grapheme==0.6.0
106
+ graphql-core==3.2.3
107
+ grpcio==1.65.1
108
+ gto==1.7.1
109
+ h11==0.14.0
110
+ h2==4.1.0
111
+ hjson==3.1.0
112
+ hpack==4.0.0
113
+ httpcore==1.0.5
114
+ httptools==0.6.1
115
+ httpx==0.27.2
116
+ huggingface-hub==0.24.3
117
+ hydra-core==1.3.2
118
+ hyperframe==6.0.1
119
+ identify==2.6.0
120
+ idna==3.7
121
+ imageio-ffmpeg==0.5.1
122
+ imageio==2.35.1
123
+ importlib_metadata==8.0.0
124
+ importlib_metadata==8.2.0
125
+ importlib_resources==6.4.0
126
+ importlib_resources==6.4.0
127
+ inflect==7.3.1
128
+ iniconfig==2.0.0
129
+ interegular==0.3.3
130
+ ipykernel==6.29.5
131
+ ipython==8.26.0
132
+ iterative-telemetry==0.0.8
133
+ jaraco.context==5.3.0
134
+ jaraco.functools==4.0.1
135
+ jaraco.text==3.12.1
136
+ jedi==0.19.1
137
+ jmespath==1.0.1
138
+ joblib==1.4.2
139
+ jsonschema-specifications==2023.12.1
140
+ jsonschema==4.23.0
141
+ jupyter_client==8.6.2
142
+ jupyter_core==5.7.2
143
+ kiwisolver==1.4.5
144
+ kombu==5.4.0
145
+ lark==1.1.9
146
+ lazy_loader==0.4
147
+ librosa==0.10.2.post1
148
+ llamafactory==0.8.4.dev0
149
+ llamafactory==0.8.4.dev0
150
+ llvmlite==0.43.0
151
+ lm-format-enforcer==0.10.3
152
+ lxml==5.3.0
153
+ markdown-it-py==3.0.0
154
+ marshmallow==3.22.0
155
+ matplotlib-inline==0.1.7
156
+ matplotlib==3.9.1
157
+ mdurl==0.1.2
158
+ mmsg==0.1.dev14+gbd2b056.d20240803
159
+ more-itertools==10.3.0
160
+ moviepy==1.0.3
161
+ mpi4py==4.0.0
162
+ mpmath==1.3.0
163
+ msgpack==1.0.8
164
+ multidict==6.0.5
165
+ multiprocess==0.70.16
166
+ mypy-extensions==1.0.0
167
+ nest_asyncio==1.6.0
168
+ networkx==3.3
169
+ ninja==1.11.1.1
170
+ nodeenv==1.9.1
171
+ numba==0.60.0
172
+ numpy==1.26.4
173
+ nvidia-cublas-cu12==12.1.3.1
174
+ nvidia-cuda-cupti-cu12==12.1.105
175
+ nvidia-cuda-nvrtc-cu12==12.1.105
176
+ nvidia-cuda-runtime-cu12==12.1.105
177
+ nvidia-cudnn-cu12==8.9.2.26
178
+ nvidia-cufft-cu12==11.0.2.54
179
+ nvidia-curand-cu12==10.3.2.106
180
+ nvidia-cusolver-cu12==11.4.5.107
181
+ nvidia-cusparse-cu12==12.1.0.106
182
+ nvidia-ml-py==12.535.161
183
+ nvidia-nccl-cu12==2.20.5
184
+ nvidia-nvjitlink-cu12==12.5.82
185
+ nvidia-nvtx-cu12==12.1.105
186
+ nvitop==1.3.2
187
+ omegaconf==2.3.0
188
+ openai==1.37.1
189
+ optree==0.12.1
190
+ ordered-set==4.1.0
191
+ orjson==3.10.6
192
+ outlines==0.0.47.dev37+g26e2934
193
+ packaging==24.1
194
+ packaging==24.1
195
+ pandas==2.2.2
196
+ parso==0.8.4
197
+ pathspec==0.12.1
198
+ pathvalidate==3.0.0
199
+ peft==0.12.0
200
+ pexpect==4.9.0
201
+ pickleshare==0.7.5
202
+ pillow==10.4.0
203
+ pip==24.0
204
+ platformdirs==3.11.0
205
+ platformdirs==4.2.2
206
+ pluggy==1.5.0
207
+ pooch==1.8.2
208
+ pre-commit==3.8.0
209
+ proglog==0.1.10
210
+ prometheus-fastapi-instrumentator==7.0.0
211
+ prometheus_client==0.20.0
212
+ prompt_toolkit==3.0.47
213
+ protobuf==4.25.4
214
+ psutil==6.0.0
215
+ ptyprocess==0.7.0
216
+ pure_eval==0.2.3
217
+ py-cpuinfo==9.0.0
218
+ pyairports==2.1.1
219
+ pyarrow-hotfix==0.6
220
+ pyarrow==17.0.0
221
+ pyav==13.0.0
222
+ pycountry==24.6.1
223
+ pycparser==2.22
224
+ pydantic==2.8.2
225
+ pydantic_core==2.20.1
226
+ pydot==3.0.1
227
+ pydub==0.25.1
228
+ pygit2==1.15.1
229
+ pygtrie==2.5.0
230
+ pyparsing==3.1.2
231
+ pytest==8.3.2
232
+ python-dateutil==2.9.0
233
+ python-dateutil==2.9.0.post0
234
+ python-dotenv==1.0.1
235
+ python-multipart==0.0.9
236
+ pytz==2024.1
237
+ pyzmq==26.0.3
238
+ ranger-fm==1.9.3
239
+ ray==2.34.0
240
+ referencing==0.35.1
241
+ regex==2024.7.24
242
+ requests-toolbelt==1.0.0
243
+ requests==2.32.3
244
+ rfc3986==1.5.0
245
+ rich==13.1.0
246
+ rpds-py==0.19.1
247
+ ruamel.yaml.clib==0.2.8
248
+ ruamel.yaml==0.18.6
249
+ ruff==0.5.5
250
+ s3transfer==0.10.2
251
+ safetensors==0.4.3
252
+ scikit-learn==1.5.1
253
+ scipy==1.14.0
254
+ scmrepo==3.3.7
255
+ semantic-version==2.10.0
256
+ semver==3.0.2
257
+ sentencepiece==0.2.0
258
+ sentry-sdk==2.11.0
259
+ setproctitle==1.3.3
260
+ setuptools==71.0.4
261
+ shellingham==1.5.4
262
+ shortuuid==1.0.13
263
+ shtab==1.7.1
264
+ six==1.16.0
265
+ smmap==5.0.1
266
+ sniffio==1.3.1
267
+ soundfile==0.12.1
268
+ soxr==0.4.0
269
+ sqltrie==0.11.1
270
+ sse-starlette==2.1.3
271
+ stack-data==0.6.2
272
+ starlette==0.37.2
273
+ sympy==1.13.0
274
+ tabulate==0.9.0
275
+ tenacity==8.2.3
276
+ tensorboard-data-server==0.7.2
277
+ tensorboard==2.17.0
278
+ term-image==0.7.2
279
+ termcolor==2.4.0
280
+ threadpoolctl==3.5.0
281
+ tiktoken==0.7.0
282
+ tokenizers==0.19.1
283
+ tomli==2.0.1
284
+ tomlkit==0.12.0
285
+ torch==2.3.1
286
+ torch==2.4.0
287
+ torchaudio==2.4.0
288
+ torchvision==0.18.1
289
+ torchvision==0.19.0
290
+ tornado==6.4.1
291
+ tqdm==4.66.4
292
+ traitlets==5.14.3
293
+ transformers==4.45.0.dev0
294
+ treelib==1.6.4
295
+ triton==2.3.1
296
+ triton==3.0.0
297
+ trl==0.9.6
298
+ typeguard==4.3.0
299
+ typer==0.12.3
300
+ typing-inspect==0.9.0
301
+ typing_extensions==4.12.2
302
+ typing_extensions==4.12.2
303
+ tyro==0.8.10
304
+ tzdata==2024.1
305
+ urllib3==2.2.2
306
+ uvicorn==0.30.3
307
+ uvloop==0.19.0
308
+ vine==5.1.0
309
+ virtualenv==20.26.3
310
+ vllm-flash-attn==2.5.9.post1
311
+ vllm==0.5.3.post1
312
+ voluptuous==0.15.2
313
+ wandb==0.17.5
314
+ watchfiles==0.22.0
315
+ wcwidth==0.2.13
316
+ websockets==11.0.3
317
+ wheel==0.43.0
318
+ wheel==0.43.0
319
+ xformers==0.0.27
320
+ xxhash==3.4.1
321
+ yarl==1.9.4
322
+ zc.lockfile==3.0.post1
323
+ zipp==3.19.2
324
+ zipp==3.19.2
325
+ zstandard==0.23.0
wandb/run-20240921_115259-p9bvnzls/files/wandb-metadata.json ADDED
@@ -0,0 +1,1215 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "os": "Linux-5.15.0-1040-nvidia-x86_64-with-glibc2.35",
3
+ "python": "3.11.9",
4
+ "heartbeatAt": "2024-09-21T03:53:00.216617",
5
+ "startedAt": "2024-09-21T03:52:59.188378",
6
+ "docker": null,
7
+ "cuda": null,
8
+ "args": [
9
+ "--local_rank=0",
10
+ "--model_name_or_path",
11
+ "/aifs4su/yaodong/models/Qwen2-VL-7B-Instruct",
12
+ "--train_datasets",
13
+ "/aifs4su/yaodong/datasets/aaa_dataset/TV2T-preference/extracted",
14
+ "--output_dir",
15
+ "../outputs/dpo_tiv2t_1.5k_base",
16
+ "--train_data_files",
17
+ "extracted_preference_1.5k_washed.json",
18
+ "--train_template",
19
+ "NExTQA_preference",
20
+ "--train_split",
21
+ "train",
22
+ "--per_device_train_batch_size",
23
+ "1",
24
+ "--per_device_eval_batch_size",
25
+ "1",
26
+ "--gradient_accumulation_steps",
27
+ "1"
28
+ ],
29
+ "state": "running",
30
+ "program": "-m align_anything.trainers.tiv_to_t.dpo",
31
+ "codePathLocal": null,
32
+ "git": {
33
+ "remote": "git@github.com-hantao:htlou/align-anything.git",
34
+ "commit": "9eff99b0ee34f7265b8a2e1824650634c898f654"
35
+ },
36
+ "email": "2200017789@stu.pku.edu.cn",
37
+ "root": "/aifs4su/yaodong/projects/hantao/dev_cham/align-anything",
38
+ "host": "dgx-122",
39
+ "username": "yangyaodong",
40
+ "executable": "/aifs4su/yaodong/miniconda3/envs/hantao_tiv/bin/python3.11",
41
+ "cpu_count": 112,
42
+ "cpu_count_logical": 224,
43
+ "cpu_freq": {
44
+ "current": 2053.164705357143,
45
+ "min": 800.0,
46
+ "max": 3800.0
47
+ },
48
+ "cpu_freq_per_core": [
49
+ {
50
+ "current": 2000.0,
51
+ "min": 800.0,
52
+ "max": 3800.0
53
+ },
54
+ {
55
+ "current": 2000.0,
56
+ "min": 800.0,
57
+ "max": 3800.0
58
+ },
59
+ {
60
+ "current": 2000.0,
61
+ "min": 800.0,
62
+ "max": 3800.0
63
+ },
64
+ {
65
+ "current": 2000.0,
66
+ "min": 800.0,
67
+ "max": 3800.0
68
+ },
69
+ {
70
+ "current": 2000.0,
71
+ "min": 800.0,
72
+ "max": 3800.0
73
+ },
74
+ {
75
+ "current": 2000.0,
76
+ "min": 800.0,
77
+ "max": 3800.0
78
+ },
79
+ {
80
+ "current": 2999.728,
81
+ "min": 800.0,
82
+ "max": 3800.0
83
+ },
84
+ {
85
+ "current": 2000.0,
86
+ "min": 800.0,
87
+ "max": 3800.0
88
+ },
89
+ {
90
+ "current": 3000.0,
91
+ "min": 800.0,
92
+ "max": 3800.0
93
+ },
94
+ {
95
+ "current": 2000.0,
96
+ "min": 800.0,
97
+ "max": 3800.0
98
+ },
99
+ {
100
+ "current": 2999.218,
101
+ "min": 800.0,
102
+ "max": 3800.0
103
+ },
104
+ {
105
+ "current": 2000.0,
106
+ "min": 800.0,
107
+ "max": 3800.0
108
+ },
109
+ {
110
+ "current": 2000.0,
111
+ "min": 800.0,
112
+ "max": 3800.0
113
+ },
114
+ {
115
+ "current": 3000.0,
116
+ "min": 800.0,
117
+ "max": 3800.0
118
+ },
119
+ {
120
+ "current": 2000.0,
121
+ "min": 800.0,
122
+ "max": 3800.0
123
+ },
124
+ {
125
+ "current": 2000.0,
126
+ "min": 800.0,
127
+ "max": 3800.0
128
+ },
129
+ {
130
+ "current": 2000.0,
131
+ "min": 800.0,
132
+ "max": 3800.0
133
+ },
134
+ {
135
+ "current": 2000.0,
136
+ "min": 800.0,
137
+ "max": 3800.0
138
+ },
139
+ {
140
+ "current": 3000.0,
141
+ "min": 800.0,
142
+ "max": 3800.0
143
+ },
144
+ {
145
+ "current": 2000.0,
146
+ "min": 800.0,
147
+ "max": 3800.0
148
+ },
149
+ {
150
+ "current": 2000.0,
151
+ "min": 800.0,
152
+ "max": 3800.0
153
+ },
154
+ {
155
+ "current": 2000.0,
156
+ "min": 800.0,
157
+ "max": 3800.0
158
+ },
159
+ {
160
+ "current": 2000.0,
161
+ "min": 800.0,
162
+ "max": 3800.0
163
+ },
164
+ {
165
+ "current": 2000.0,
166
+ "min": 800.0,
167
+ "max": 3800.0
168
+ },
169
+ {
170
+ "current": 3000.001,
171
+ "min": 800.0,
172
+ "max": 3800.0
173
+ },
174
+ {
175
+ "current": 2000.0,
176
+ "min": 800.0,
177
+ "max": 3800.0
178
+ },
179
+ {
180
+ "current": 2000.0,
181
+ "min": 800.0,
182
+ "max": 3800.0
183
+ },
184
+ {
185
+ "current": 2000.0,
186
+ "min": 800.0,
187
+ "max": 3800.0
188
+ },
189
+ {
190
+ "current": 2000.0,
191
+ "min": 800.0,
192
+ "max": 3800.0
193
+ },
194
+ {
195
+ "current": 3000.0,
196
+ "min": 800.0,
197
+ "max": 3800.0
198
+ },
199
+ {
200
+ "current": 2000.0,
201
+ "min": 800.0,
202
+ "max": 3800.0
203
+ },
204
+ {
205
+ "current": 2000.0,
206
+ "min": 800.0,
207
+ "max": 3800.0
208
+ },
209
+ {
210
+ "current": 2000.0,
211
+ "min": 800.0,
212
+ "max": 3800.0
213
+ },
214
+ {
215
+ "current": 2000.0,
216
+ "min": 800.0,
217
+ "max": 3800.0
218
+ },
219
+ {
220
+ "current": 2000.0,
221
+ "min": 800.0,
222
+ "max": 3800.0
223
+ },
224
+ {
225
+ "current": 2000.0,
226
+ "min": 800.0,
227
+ "max": 3800.0
228
+ },
229
+ {
230
+ "current": 2000.0,
231
+ "min": 800.0,
232
+ "max": 3800.0
233
+ },
234
+ {
235
+ "current": 2000.0,
236
+ "min": 800.0,
237
+ "max": 3800.0
238
+ },
239
+ {
240
+ "current": 2000.0,
241
+ "min": 800.0,
242
+ "max": 3800.0
243
+ },
244
+ {
245
+ "current": 2000.0,
246
+ "min": 800.0,
247
+ "max": 3800.0
248
+ },
249
+ {
250
+ "current": 2000.0,
251
+ "min": 800.0,
252
+ "max": 3800.0
253
+ },
254
+ {
255
+ "current": 2000.0,
256
+ "min": 800.0,
257
+ "max": 3800.0
258
+ },
259
+ {
260
+ "current": 2000.0,
261
+ "min": 800.0,
262
+ "max": 3800.0
263
+ },
264
+ {
265
+ "current": 2000.0,
266
+ "min": 800.0,
267
+ "max": 3800.0
268
+ },
269
+ {
270
+ "current": 2000.0,
271
+ "min": 800.0,
272
+ "max": 3800.0
273
+ },
274
+ {
275
+ "current": 2000.0,
276
+ "min": 800.0,
277
+ "max": 3800.0
278
+ },
279
+ {
280
+ "current": 2000.0,
281
+ "min": 800.0,
282
+ "max": 3800.0
283
+ },
284
+ {
285
+ "current": 2000.0,
286
+ "min": 800.0,
287
+ "max": 3800.0
288
+ },
289
+ {
290
+ "current": 2000.0,
291
+ "min": 800.0,
292
+ "max": 3800.0
293
+ },
294
+ {
295
+ "current": 2000.0,
296
+ "min": 800.0,
297
+ "max": 3800.0
298
+ },
299
+ {
300
+ "current": 2000.0,
301
+ "min": 800.0,
302
+ "max": 3800.0
303
+ },
304
+ {
305
+ "current": 2000.0,
306
+ "min": 800.0,
307
+ "max": 3800.0
308
+ },
309
+ {
310
+ "current": 2000.0,
311
+ "min": 800.0,
312
+ "max": 3800.0
313
+ },
314
+ {
315
+ "current": 2000.0,
316
+ "min": 800.0,
317
+ "max": 3800.0
318
+ },
319
+ {
320
+ "current": 2000.0,
321
+ "min": 800.0,
322
+ "max": 3800.0
323
+ },
324
+ {
325
+ "current": 2000.0,
326
+ "min": 800.0,
327
+ "max": 3800.0
328
+ },
329
+ {
330
+ "current": 2000.0,
331
+ "min": 800.0,
332
+ "max": 3800.0
333
+ },
334
+ {
335
+ "current": 2000.0,
336
+ "min": 800.0,
337
+ "max": 3800.0
338
+ },
339
+ {
340
+ "current": 2000.0,
341
+ "min": 800.0,
342
+ "max": 3800.0
343
+ },
344
+ {
345
+ "current": 2000.0,
346
+ "min": 800.0,
347
+ "max": 3800.0
348
+ },
349
+ {
350
+ "current": 2000.0,
351
+ "min": 800.0,
352
+ "max": 3800.0
353
+ },
354
+ {
355
+ "current": 2000.0,
356
+ "min": 800.0,
357
+ "max": 3800.0
358
+ },
359
+ {
360
+ "current": 2000.0,
361
+ "min": 800.0,
362
+ "max": 3800.0
363
+ },
364
+ {
365
+ "current": 2000.0,
366
+ "min": 800.0,
367
+ "max": 3800.0
368
+ },
369
+ {
370
+ "current": 2000.0,
371
+ "min": 800.0,
372
+ "max": 3800.0
373
+ },
374
+ {
375
+ "current": 2000.0,
376
+ "min": 800.0,
377
+ "max": 3800.0
378
+ },
379
+ {
380
+ "current": 2000.0,
381
+ "min": 800.0,
382
+ "max": 3800.0
383
+ },
384
+ {
385
+ "current": 2000.0,
386
+ "min": 800.0,
387
+ "max": 3800.0
388
+ },
389
+ {
390
+ "current": 2000.0,
391
+ "min": 800.0,
392
+ "max": 3800.0
393
+ },
394
+ {
395
+ "current": 2000.0,
396
+ "min": 800.0,
397
+ "max": 3800.0
398
+ },
399
+ {
400
+ "current": 2000.0,
401
+ "min": 800.0,
402
+ "max": 3800.0
403
+ },
404
+ {
405
+ "current": 2900.0,
406
+ "min": 800.0,
407
+ "max": 3800.0
408
+ },
409
+ {
410
+ "current": 2000.0,
411
+ "min": 800.0,
412
+ "max": 3800.0
413
+ },
414
+ {
415
+ "current": 2000.0,
416
+ "min": 800.0,
417
+ "max": 3800.0
418
+ },
419
+ {
420
+ "current": 2000.0,
421
+ "min": 800.0,
422
+ "max": 3800.0
423
+ },
424
+ {
425
+ "current": 2000.0,
426
+ "min": 800.0,
427
+ "max": 3800.0
428
+ },
429
+ {
430
+ "current": 2000.0,
431
+ "min": 800.0,
432
+ "max": 3800.0
433
+ },
434
+ {
435
+ "current": 2000.0,
436
+ "min": 800.0,
437
+ "max": 3800.0
438
+ },
439
+ {
440
+ "current": 2000.0,
441
+ "min": 800.0,
442
+ "max": 3800.0
443
+ },
444
+ {
445
+ "current": 2000.0,
446
+ "min": 800.0,
447
+ "max": 3800.0
448
+ },
449
+ {
450
+ "current": 2000.0,
451
+ "min": 800.0,
452
+ "max": 3800.0
453
+ },
454
+ {
455
+ "current": 2000.0,
456
+ "min": 800.0,
457
+ "max": 3800.0
458
+ },
459
+ {
460
+ "current": 2000.0,
461
+ "min": 800.0,
462
+ "max": 3800.0
463
+ },
464
+ {
465
+ "current": 2000.0,
466
+ "min": 800.0,
467
+ "max": 3800.0
468
+ },
469
+ {
470
+ "current": 2000.0,
471
+ "min": 800.0,
472
+ "max": 3800.0
473
+ },
474
+ {
475
+ "current": 2000.0,
476
+ "min": 800.0,
477
+ "max": 3800.0
478
+ },
479
+ {
480
+ "current": 2000.0,
481
+ "min": 800.0,
482
+ "max": 3800.0
483
+ },
484
+ {
485
+ "current": 2000.0,
486
+ "min": 800.0,
487
+ "max": 3800.0
488
+ },
489
+ {
490
+ "current": 2000.0,
491
+ "min": 800.0,
492
+ "max": 3800.0
493
+ },
494
+ {
495
+ "current": 2000.0,
496
+ "min": 800.0,
497
+ "max": 3800.0
498
+ },
499
+ {
500
+ "current": 2000.0,
501
+ "min": 800.0,
502
+ "max": 3800.0
503
+ },
504
+ {
505
+ "current": 2000.0,
506
+ "min": 800.0,
507
+ "max": 3800.0
508
+ },
509
+ {
510
+ "current": 2000.0,
511
+ "min": 800.0,
512
+ "max": 3800.0
513
+ },
514
+ {
515
+ "current": 2000.0,
516
+ "min": 800.0,
517
+ "max": 3800.0
518
+ },
519
+ {
520
+ "current": 2000.0,
521
+ "min": 800.0,
522
+ "max": 3800.0
523
+ },
524
+ {
525
+ "current": 2000.0,
526
+ "min": 800.0,
527
+ "max": 3800.0
528
+ },
529
+ {
530
+ "current": 2000.0,
531
+ "min": 800.0,
532
+ "max": 3800.0
533
+ },
534
+ {
535
+ "current": 2000.0,
536
+ "min": 800.0,
537
+ "max": 3800.0
538
+ },
539
+ {
540
+ "current": 2000.0,
541
+ "min": 800.0,
542
+ "max": 3800.0
543
+ },
544
+ {
545
+ "current": 2000.0,
546
+ "min": 800.0,
547
+ "max": 3800.0
548
+ },
549
+ {
550
+ "current": 2000.0,
551
+ "min": 800.0,
552
+ "max": 3800.0
553
+ },
554
+ {
555
+ "current": 2000.0,
556
+ "min": 800.0,
557
+ "max": 3800.0
558
+ },
559
+ {
560
+ "current": 2000.0,
561
+ "min": 800.0,
562
+ "max": 3800.0
563
+ },
564
+ {
565
+ "current": 2000.0,
566
+ "min": 800.0,
567
+ "max": 3800.0
568
+ },
569
+ {
570
+ "current": 2000.0,
571
+ "min": 800.0,
572
+ "max": 3800.0
573
+ },
574
+ {
575
+ "current": 2900.0,
576
+ "min": 800.0,
577
+ "max": 3800.0
578
+ },
579
+ {
580
+ "current": 2000.0,
581
+ "min": 800.0,
582
+ "max": 3800.0
583
+ },
584
+ {
585
+ "current": 2000.0,
586
+ "min": 800.0,
587
+ "max": 3800.0
588
+ },
589
+ {
590
+ "current": 2000.0,
591
+ "min": 800.0,
592
+ "max": 3800.0
593
+ },
594
+ {
595
+ "current": 2000.0,
596
+ "min": 800.0,
597
+ "max": 3800.0
598
+ },
599
+ {
600
+ "current": 2000.0,
601
+ "min": 800.0,
602
+ "max": 3800.0
603
+ },
604
+ {
605
+ "current": 2000.0,
606
+ "min": 800.0,
607
+ "max": 3800.0
608
+ },
609
+ {
610
+ "current": 2000.0,
611
+ "min": 800.0,
612
+ "max": 3800.0
613
+ },
614
+ {
615
+ "current": 2000.0,
616
+ "min": 800.0,
617
+ "max": 3800.0
618
+ },
619
+ {
620
+ "current": 2000.0,
621
+ "min": 800.0,
622
+ "max": 3800.0
623
+ },
624
+ {
625
+ "current": 2000.0,
626
+ "min": 800.0,
627
+ "max": 3800.0
628
+ },
629
+ {
630
+ "current": 2000.0,
631
+ "min": 800.0,
632
+ "max": 3800.0
633
+ },
634
+ {
635
+ "current": 2000.0,
636
+ "min": 800.0,
637
+ "max": 3800.0
638
+ },
639
+ {
640
+ "current": 2000.0,
641
+ "min": 800.0,
642
+ "max": 3800.0
643
+ },
644
+ {
645
+ "current": 2000.0,
646
+ "min": 800.0,
647
+ "max": 3800.0
648
+ },
649
+ {
650
+ "current": 2000.0,
651
+ "min": 800.0,
652
+ "max": 3800.0
653
+ },
654
+ {
655
+ "current": 2000.0,
656
+ "min": 800.0,
657
+ "max": 3800.0
658
+ },
659
+ {
660
+ "current": 2000.0,
661
+ "min": 800.0,
662
+ "max": 3800.0
663
+ },
664
+ {
665
+ "current": 2000.0,
666
+ "min": 800.0,
667
+ "max": 3800.0
668
+ },
669
+ {
670
+ "current": 2000.0,
671
+ "min": 800.0,
672
+ "max": 3800.0
673
+ },
674
+ {
675
+ "current": 2000.0,
676
+ "min": 800.0,
677
+ "max": 3800.0
678
+ },
679
+ {
680
+ "current": 2000.0,
681
+ "min": 800.0,
682
+ "max": 3800.0
683
+ },
684
+ {
685
+ "current": 2000.0,
686
+ "min": 800.0,
687
+ "max": 3800.0
688
+ },
689
+ {
690
+ "current": 2000.0,
691
+ "min": 800.0,
692
+ "max": 3800.0
693
+ },
694
+ {
695
+ "current": 3000.0,
696
+ "min": 800.0,
697
+ "max": 3800.0
698
+ },
699
+ {
700
+ "current": 2000.0,
701
+ "min": 800.0,
702
+ "max": 3800.0
703
+ },
704
+ {
705
+ "current": 2000.0,
706
+ "min": 800.0,
707
+ "max": 3800.0
708
+ },
709
+ {
710
+ "current": 2000.0,
711
+ "min": 800.0,
712
+ "max": 3800.0
713
+ },
714
+ {
715
+ "current": 2000.0,
716
+ "min": 800.0,
717
+ "max": 3800.0
718
+ },
719
+ {
720
+ "current": 2000.0,
721
+ "min": 800.0,
722
+ "max": 3800.0
723
+ },
724
+ {
725
+ "current": 2000.0,
726
+ "min": 800.0,
727
+ "max": 3800.0
728
+ },
729
+ {
730
+ "current": 2000.0,
731
+ "min": 800.0,
732
+ "max": 3800.0
733
+ },
734
+ {
735
+ "current": 2000.0,
736
+ "min": 800.0,
737
+ "max": 3800.0
738
+ },
739
+ {
740
+ "current": 2000.0,
741
+ "min": 800.0,
742
+ "max": 3800.0
743
+ },
744
+ {
745
+ "current": 2000.0,
746
+ "min": 800.0,
747
+ "max": 3800.0
748
+ },
749
+ {
750
+ "current": 2000.0,
751
+ "min": 800.0,
752
+ "max": 3800.0
753
+ },
754
+ {
755
+ "current": 2000.0,
756
+ "min": 800.0,
757
+ "max": 3800.0
758
+ },
759
+ {
760
+ "current": 2000.0,
761
+ "min": 800.0,
762
+ "max": 3800.0
763
+ },
764
+ {
765
+ "current": 2000.0,
766
+ "min": 800.0,
767
+ "max": 3800.0
768
+ },
769
+ {
770
+ "current": 2000.0,
771
+ "min": 800.0,
772
+ "max": 3800.0
773
+ },
774
+ {
775
+ "current": 2993.46,
776
+ "min": 800.0,
777
+ "max": 3800.0
778
+ },
779
+ {
780
+ "current": 2000.0,
781
+ "min": 800.0,
782
+ "max": 3800.0
783
+ },
784
+ {
785
+ "current": 2000.0,
786
+ "min": 800.0,
787
+ "max": 3800.0
788
+ },
789
+ {
790
+ "current": 2000.0,
791
+ "min": 800.0,
792
+ "max": 3800.0
793
+ },
794
+ {
795
+ "current": 2000.0,
796
+ "min": 800.0,
797
+ "max": 3800.0
798
+ },
799
+ {
800
+ "current": 2000.0,
801
+ "min": 800.0,
802
+ "max": 3800.0
803
+ },
804
+ {
805
+ "current": 2000.0,
806
+ "min": 800.0,
807
+ "max": 3800.0
808
+ },
809
+ {
810
+ "current": 2000.0,
811
+ "min": 800.0,
812
+ "max": 3800.0
813
+ },
814
+ {
815
+ "current": 2000.0,
816
+ "min": 800.0,
817
+ "max": 3800.0
818
+ },
819
+ {
820
+ "current": 2000.0,
821
+ "min": 800.0,
822
+ "max": 3800.0
823
+ },
824
+ {
825
+ "current": 2000.0,
826
+ "min": 800.0,
827
+ "max": 3800.0
828
+ },
829
+ {
830
+ "current": 2000.0,
831
+ "min": 800.0,
832
+ "max": 3800.0
833
+ },
834
+ {
835
+ "current": 2000.0,
836
+ "min": 800.0,
837
+ "max": 3800.0
838
+ },
839
+ {
840
+ "current": 2000.0,
841
+ "min": 800.0,
842
+ "max": 3800.0
843
+ },
844
+ {
845
+ "current": 2000.0,
846
+ "min": 800.0,
847
+ "max": 3800.0
848
+ },
849
+ {
850
+ "current": 2000.0,
851
+ "min": 800.0,
852
+ "max": 3800.0
853
+ },
854
+ {
855
+ "current": 2000.0,
856
+ "min": 800.0,
857
+ "max": 3800.0
858
+ },
859
+ {
860
+ "current": 2000.0,
861
+ "min": 800.0,
862
+ "max": 3800.0
863
+ },
864
+ {
865
+ "current": 2000.0,
866
+ "min": 800.0,
867
+ "max": 3800.0
868
+ },
869
+ {
870
+ "current": 2000.0,
871
+ "min": 800.0,
872
+ "max": 3800.0
873
+ },
874
+ {
875
+ "current": 2000.0,
876
+ "min": 800.0,
877
+ "max": 3800.0
878
+ },
879
+ {
880
+ "current": 2000.0,
881
+ "min": 800.0,
882
+ "max": 3800.0
883
+ },
884
+ {
885
+ "current": 2000.0,
886
+ "min": 800.0,
887
+ "max": 3800.0
888
+ },
889
+ {
890
+ "current": 2000.0,
891
+ "min": 800.0,
892
+ "max": 3800.0
893
+ },
894
+ {
895
+ "current": 2000.0,
896
+ "min": 800.0,
897
+ "max": 3800.0
898
+ },
899
+ {
900
+ "current": 2899.998,
901
+ "min": 800.0,
902
+ "max": 3800.0
903
+ },
904
+ {
905
+ "current": 2000.0,
906
+ "min": 800.0,
907
+ "max": 3800.0
908
+ },
909
+ {
910
+ "current": 2000.0,
911
+ "min": 800.0,
912
+ "max": 3800.0
913
+ },
914
+ {
915
+ "current": 2000.0,
916
+ "min": 800.0,
917
+ "max": 3800.0
918
+ },
919
+ {
920
+ "current": 2000.0,
921
+ "min": 800.0,
922
+ "max": 3800.0
923
+ },
924
+ {
925
+ "current": 2000.0,
926
+ "min": 800.0,
927
+ "max": 3800.0
928
+ },
929
+ {
930
+ "current": 2000.0,
931
+ "min": 800.0,
932
+ "max": 3800.0
933
+ },
934
+ {
935
+ "current": 2000.0,
936
+ "min": 800.0,
937
+ "max": 3800.0
938
+ },
939
+ {
940
+ "current": 2000.0,
941
+ "min": 800.0,
942
+ "max": 3800.0
943
+ },
944
+ {
945
+ "current": 2000.0,
946
+ "min": 800.0,
947
+ "max": 3800.0
948
+ },
949
+ {
950
+ "current": 2000.0,
951
+ "min": 800.0,
952
+ "max": 3800.0
953
+ },
954
+ {
955
+ "current": 2000.0,
956
+ "min": 800.0,
957
+ "max": 3800.0
958
+ },
959
+ {
960
+ "current": 2000.0,
961
+ "min": 800.0,
962
+ "max": 3800.0
963
+ },
964
+ {
965
+ "current": 2000.0,
966
+ "min": 800.0,
967
+ "max": 3800.0
968
+ },
969
+ {
970
+ "current": 2000.0,
971
+ "min": 800.0,
972
+ "max": 3800.0
973
+ },
974
+ {
975
+ "current": 2000.0,
976
+ "min": 800.0,
977
+ "max": 3800.0
978
+ },
979
+ {
980
+ "current": 2000.0,
981
+ "min": 800.0,
982
+ "max": 3800.0
983
+ },
984
+ {
985
+ "current": 2000.0,
986
+ "min": 800.0,
987
+ "max": 3800.0
988
+ },
989
+ {
990
+ "current": 2000.0,
991
+ "min": 800.0,
992
+ "max": 3800.0
993
+ },
994
+ {
995
+ "current": 2000.0,
996
+ "min": 800.0,
997
+ "max": 3800.0
998
+ },
999
+ {
1000
+ "current": 2000.0,
1001
+ "min": 800.0,
1002
+ "max": 3800.0
1003
+ },
1004
+ {
1005
+ "current": 2000.0,
1006
+ "min": 800.0,
1007
+ "max": 3800.0
1008
+ },
1009
+ {
1010
+ "current": 2000.0,
1011
+ "min": 800.0,
1012
+ "max": 3800.0
1013
+ },
1014
+ {
1015
+ "current": 2000.0,
1016
+ "min": 800.0,
1017
+ "max": 3800.0
1018
+ },
1019
+ {
1020
+ "current": 2000.0,
1021
+ "min": 800.0,
1022
+ "max": 3800.0
1023
+ },
1024
+ {
1025
+ "current": 2000.0,
1026
+ "min": 800.0,
1027
+ "max": 3800.0
1028
+ },
1029
+ {
1030
+ "current": 2000.0,
1031
+ "min": 800.0,
1032
+ "max": 3800.0
1033
+ },
1034
+ {
1035
+ "current": 2000.0,
1036
+ "min": 800.0,
1037
+ "max": 3800.0
1038
+ },
1039
+ {
1040
+ "current": 2000.0,
1041
+ "min": 800.0,
1042
+ "max": 3800.0
1043
+ },
1044
+ {
1045
+ "current": 2000.0,
1046
+ "min": 800.0,
1047
+ "max": 3800.0
1048
+ },
1049
+ {
1050
+ "current": 2000.0,
1051
+ "min": 800.0,
1052
+ "max": 3800.0
1053
+ },
1054
+ {
1055
+ "current": 2000.0,
1056
+ "min": 800.0,
1057
+ "max": 3800.0
1058
+ },
1059
+ {
1060
+ "current": 2000.0,
1061
+ "min": 800.0,
1062
+ "max": 3800.0
1063
+ },
1064
+ {
1065
+ "current": 2000.0,
1066
+ "min": 800.0,
1067
+ "max": 3800.0
1068
+ },
1069
+ {
1070
+ "current": 2000.0,
1071
+ "min": 800.0,
1072
+ "max": 3800.0
1073
+ },
1074
+ {
1075
+ "current": 2000.0,
1076
+ "min": 800.0,
1077
+ "max": 3800.0
1078
+ },
1079
+ {
1080
+ "current": 2000.0,
1081
+ "min": 800.0,
1082
+ "max": 3800.0
1083
+ },
1084
+ {
1085
+ "current": 2000.0,
1086
+ "min": 800.0,
1087
+ "max": 3800.0
1088
+ },
1089
+ {
1090
+ "current": 2000.0,
1091
+ "min": 800.0,
1092
+ "max": 3800.0
1093
+ },
1094
+ {
1095
+ "current": 2000.0,
1096
+ "min": 800.0,
1097
+ "max": 3800.0
1098
+ },
1099
+ {
1100
+ "current": 2000.0,
1101
+ "min": 800.0,
1102
+ "max": 3800.0
1103
+ },
1104
+ {
1105
+ "current": 2000.0,
1106
+ "min": 800.0,
1107
+ "max": 3800.0
1108
+ },
1109
+ {
1110
+ "current": 2000.0,
1111
+ "min": 800.0,
1112
+ "max": 3800.0
1113
+ },
1114
+ {
1115
+ "current": 2000.0,
1116
+ "min": 800.0,
1117
+ "max": 3800.0
1118
+ },
1119
+ {
1120
+ "current": 2000.0,
1121
+ "min": 800.0,
1122
+ "max": 3800.0
1123
+ },
1124
+ {
1125
+ "current": 2000.0,
1126
+ "min": 800.0,
1127
+ "max": 3800.0
1128
+ },
1129
+ {
1130
+ "current": 2000.0,
1131
+ "min": 800.0,
1132
+ "max": 3800.0
1133
+ },
1134
+ {
1135
+ "current": 2000.0,
1136
+ "min": 800.0,
1137
+ "max": 3800.0
1138
+ },
1139
+ {
1140
+ "current": 2000.0,
1141
+ "min": 800.0,
1142
+ "max": 3800.0
1143
+ },
1144
+ {
1145
+ "current": 2000.0,
1146
+ "min": 800.0,
1147
+ "max": 3800.0
1148
+ },
1149
+ {
1150
+ "current": 2000.0,
1151
+ "min": 800.0,
1152
+ "max": 3800.0
1153
+ },
1154
+ {
1155
+ "current": 2000.0,
1156
+ "min": 800.0,
1157
+ "max": 3800.0
1158
+ },
1159
+ {
1160
+ "current": 2000.0,
1161
+ "min": 800.0,
1162
+ "max": 3800.0
1163
+ },
1164
+ {
1165
+ "current": 2000.0,
1166
+ "min": 800.0,
1167
+ "max": 3800.0
1168
+ }
1169
+ ],
1170
+ "disk": {
1171
+ "/": {
1172
+ "total": 1758.8549690246582,
1173
+ "used": 114.61069869995117
1174
+ }
1175
+ },
1176
+ "gpu": "NVIDIA H800",
1177
+ "gpu_count": 8,
1178
+ "gpu_devices": [
1179
+ {
1180
+ "name": "NVIDIA H800",
1181
+ "memory_total": 85520809984
1182
+ },
1183
+ {
1184
+ "name": "NVIDIA H800",
1185
+ "memory_total": 85520809984
1186
+ },
1187
+ {
1188
+ "name": "NVIDIA H800",
1189
+ "memory_total": 85520809984
1190
+ },
1191
+ {
1192
+ "name": "NVIDIA H800",
1193
+ "memory_total": 85520809984
1194
+ },
1195
+ {
1196
+ "name": "NVIDIA H800",
1197
+ "memory_total": 85520809984
1198
+ },
1199
+ {
1200
+ "name": "NVIDIA H800",
1201
+ "memory_total": 85520809984
1202
+ },
1203
+ {
1204
+ "name": "NVIDIA H800",
1205
+ "memory_total": 85520809984
1206
+ },
1207
+ {
1208
+ "name": "NVIDIA H800",
1209
+ "memory_total": 85520809984
1210
+ }
1211
+ ],
1212
+ "memory": {
1213
+ "total": 2015.564224243164
1214
+ }
1215
+ }
wandb/run-20240921_115259-p9bvnzls/files/wandb-summary.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"train/step": 166, "train/loss": 2.49491810798645, "train/reward": -24.865015029907227, "train/better_sample_reward": -12.784756660461426, "train/worse_sample_reward": -12.080260276794434, "train/reward_accuracy": 0.625, "train/reward_margin": -0.7044967412948608, "train/lr": 7.861083133307247e-07, "train/epoch": 0.9378531073446328, "_timestamp": 1726892593.1315699, "_runtime": 1813.9295139312744, "_step": 166}
wandb/run-20240921_115259-p9bvnzls/logs/debug-internal.log ADDED
The diff for this file is too large to render. See raw diff