Add files using upload-large-folder tool
Browse files- 0417_reward.py +500 -0
- 0417train.sh +75 -0
- wandb/debug-internal.log +72 -0
- wandb/debug.log +26 -0
- wandb/run-20260417_122253-6ntp64iz/files/output.log +0 -0
- wandb/run-20260417_122253-6ntp64iz/files/requirements.txt +255 -0
- wandb/run-20260417_122253-6ntp64iz/files/wandb-metadata.json +223 -0
- wandb/run-20260417_122253-6ntp64iz/files/wandb-summary.json +1 -0
- wandb/run-20260417_122253-6ntp64iz/logs/debug-core.log +12 -0
- wandb/run-20260417_122253-6ntp64iz/logs/debug-internal.log +7 -0
- wandb/run-20260417_122253-6ntp64iz/logs/debug.log +26 -0
- wandb/run-20260417_123237-3h84yfea/files/config.yaml +1272 -0
- wandb/run-20260417_123237-3h84yfea/files/media/table/completions_1_e5129c1db5b8522d8aa7.table.json +1 -0
- wandb/run-20260417_123237-3h84yfea/files/media/table/completions_3_0656117578a4523e0161.table.json +1 -0
- wandb/run-20260417_123237-3h84yfea/files/media/table/completions_5_f2bf6a8e887194296a09.table.json +1 -0
- wandb/run-20260417_123237-3h84yfea/files/media/table/completions_7_4930391b310cfe338705.table.json +1 -0
- wandb/run-20260417_123237-3h84yfea/files/media/table/completions_9_ec21142175e3781c9ddd.table.json +1 -0
- wandb/run-20260417_123237-3h84yfea/files/output.log +326 -0
- wandb/run-20260417_123237-3h84yfea/files/requirements.txt +255 -0
- wandb/run-20260417_123237-3h84yfea/files/wandb-metadata.json +223 -0
- wandb/run-20260417_123237-3h84yfea/files/wandb-summary.json +1 -0
- wandb/run-20260417_123237-3h84yfea/logs/debug-core.log +14 -0
- wandb/run-20260417_123237-3h84yfea/logs/debug-internal.log +14 -0
- wandb/run-20260417_123237-3h84yfea/logs/debug.log +26 -0
- wandb/run-20260417_125349-3c0s7mq3/files/config.yaml +1273 -0
- wandb/run-20260417_125349-3c0s7mq3/files/media/table/completions_1_1de95d5626025fdbb34e.table.json +1 -0
- wandb/run-20260417_125349-3c0s7mq3/files/media/table/completions_3_b8120af2e2a4bc038eb5.table.json +1 -0
- wandb/run-20260417_125349-3c0s7mq3/files/media/table/completions_5_510c5f07b145276e4210.table.json +1 -0
- wandb/run-20260417_125349-3c0s7mq3/files/output.log +76 -0
- wandb/run-20260417_125349-3c0s7mq3/files/requirements.txt +255 -0
- wandb/run-20260417_125349-3c0s7mq3/files/wandb-metadata.json +224 -0
- wandb/run-20260417_125349-3c0s7mq3/files/wandb-summary.json +1 -0
- wandb/run-20260417_125349-3c0s7mq3/logs/debug-core.log +11 -0
- wandb/run-20260417_125349-3c0s7mq3/logs/debug-internal.log +11 -0
- wandb/run-20260417_125349-3c0s7mq3/logs/debug.log +26 -0
- wandb/run-20260418_172847-c2a5hfz3/files/config.yaml +1262 -0
- wandb/run-20260418_172847-c2a5hfz3/files/media/table/completions_291_2ce0194cf48cadccd2a9.table.json +1 -0
- wandb/run-20260418_172847-c2a5hfz3/files/media/table/completions_297_2c3b42b29065c75ff192.table.json +1 -0
- wandb/run-20260418_172847-c2a5hfz3/files/media/table/completions_325_dedd0bb2cd2d27e14a92.table.json +1 -0
- wandb/run-20260418_172847-c2a5hfz3/files/media/table/completions_331_10c4aed0f625c56bd04d.table.json +1 -0
- wandb/run-20260418_172847-c2a5hfz3/files/media/table/completions_335_3461640c297d6819a123.table.json +1 -0
- wandb/run-20260418_172847-c2a5hfz3/files/media/table/completions_411_885808c4b4bd708583eb.table.json +1 -0
- wandb/run-20260418_172847-c2a5hfz3/files/media/table/completions_43_9ca1008a424f8bb91c1c.table.json +1 -0
- wandb/run-20260418_172847-c2a5hfz3/files/media/table/completions_63_9c15897616f0ff0b68b9.table.json +1 -0
- wandb/run-20260418_172847-c2a5hfz3/files/output.log +0 -0
- wandb/run-20260418_172847-c2a5hfz3/files/requirements.txt +255 -0
- wandb/run-20260418_172847-c2a5hfz3/files/wandb-metadata.json +213 -0
- wandb/run-20260418_172847-c2a5hfz3/files/wandb-summary.json +1 -0
- wandb/run-20260418_172847-c2a5hfz3/logs/debug-internal.log +72 -0
- wandb/run-20260418_172847-c2a5hfz3/logs/debug.log +26 -0
0417_reward.py
ADDED
|
@@ -0,0 +1,500 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# asr_RL_reward_v56_dirty.py
|
| 2 |
+
# -*- coding: utf-8 -*-
|
| 3 |
+
|
| 4 |
+
import re
|
| 5 |
+
import json
|
| 6 |
+
import os
|
| 7 |
+
import time
|
| 8 |
+
from functools import lru_cache
|
| 9 |
+
from collections import Counter
|
| 10 |
+
from typing import Any, Dict, List, Tuple
|
| 11 |
+
|
| 12 |
+
try:
|
| 13 |
+
from swift.rewards import ORM, orms
|
| 14 |
+
except Exception:
|
| 15 |
+
from swift.plugin import ORM, orms
|
| 16 |
+
|
| 17 |
+
from qwen_asr.inference.utils import parse_asr_output
|
| 18 |
+
|
| 19 |
+
_ANSWER_RE = re.compile(r"<answer>(.*?)</answer>", re.S | re.I)
|
| 20 |
+
_REWARD_DEBUG_COUNTER: Dict[str, int] = {}
|
| 21 |
+
|
| 22 |
+
|
| 23 |
+
def _as_bool(x, default: bool = False) -> bool:
|
| 24 |
+
if x is None:
|
| 25 |
+
return default
|
| 26 |
+
if isinstance(x, bool):
|
| 27 |
+
return x
|
| 28 |
+
if isinstance(x, (int, float)):
|
| 29 |
+
return bool(x)
|
| 30 |
+
return str(x).strip().lower() in {"1", "true", "yes", "y", "on"}
|
| 31 |
+
|
| 32 |
+
|
| 33 |
+
def _to_jsonable(x: Any):
|
| 34 |
+
if x is None or isinstance(x, (str, int, float, bool)):
|
| 35 |
+
return x
|
| 36 |
+
if isinstance(x, (list, tuple)):
|
| 37 |
+
return [_to_jsonable(v) for v in x]
|
| 38 |
+
if isinstance(x, dict):
|
| 39 |
+
return {str(k): _to_jsonable(v) for k, v in x.items()}
|
| 40 |
+
return str(x)
|
| 41 |
+
|
| 42 |
+
|
| 43 |
+
def _pick_field(x, i: int):
|
| 44 |
+
if x is None:
|
| 45 |
+
return None
|
| 46 |
+
if isinstance(x, (list, tuple)):
|
| 47 |
+
return x[i] if i < len(x) else None
|
| 48 |
+
return x
|
| 49 |
+
|
| 50 |
+
|
| 51 |
+
def _reward_debug_enabled(kwargs) -> bool:
    """Tell whether reward debug logging is switched on.

    An explicit ``reward_debug`` entry in ``kwargs`` takes precedence (even
    when its value is ``None``); otherwise the ``ASR_REWARD_DEBUG``
    environment variable decides.
    """
    if "reward_debug" in kwargs:
        flag = kwargs.get("reward_debug")
    else:
        flag = os.environ.get("ASR_REWARD_DEBUG")
    return _as_bool(flag, default=False)
|
| 55 |
+
|
| 56 |
+
|
| 57 |
+
def _reward_debug_path(kwargs, reward_name: str) -> str:
|
| 58 |
+
base = kwargs.get("reward_debug_path") or os.environ.get("ASR_REWARD_DEBUG_PATH")
|
| 59 |
+
if not base:
|
| 60 |
+
return ""
|
| 61 |
+
base = str(base)
|
| 62 |
+
if base.endswith(".jsonl"):
|
| 63 |
+
base = base[:-6]
|
| 64 |
+
return f"{base}.{reward_name}.pid{os.getpid()}.jsonl"
|
| 65 |
+
|
| 66 |
+
|
| 67 |
+
def _reward_debug_max_rows(kwargs) -> int:
|
| 68 |
+
x = kwargs.get("reward_debug_max_rows")
|
| 69 |
+
if x is None:
|
| 70 |
+
x = os.environ.get("ASR_REWARD_DEBUG_MAX_ROWS", 1000)
|
| 71 |
+
try:
|
| 72 |
+
x = int(x)
|
| 73 |
+
except Exception:
|
| 74 |
+
x = 1000
|
| 75 |
+
return max(0, x)
|
| 76 |
+
|
| 77 |
+
|
| 78 |
+
def _collect_common_debug_meta(kwargs, i: int) -> Dict[str, Any]:
    """Gather the well-known metadata columns for sample ``i``.

    Only keys actually present in ``kwargs`` are included; each value is
    indexed per-sample via ``_pick_field`` and made JSON-safe.
    """
    known_keys = (
        "step", "id", "sample_id", "group_id", "utt_id", "audio_id", "audio_path",
        "task", "lang", "language", "base_wer", "base_wer_bucket", "difficulty_bucket", "wer",
        "dirty_type",
    )
    return {
        key: _to_jsonable(_pick_field(kwargs.get(key), i))
        for key in known_keys
        if key in kwargs
    }
|
| 89 |
+
|
| 90 |
+
|
| 91 |
+
def _append_reward_debug_row(reward_name: str, kwargs, row: Dict[str, Any]) -> None:
    """Append one debug record to the reward's JSONL file (best effort).

    Does nothing when debugging is disabled, no path is configured, the row
    cap is zero, or this process has already written the cap for that path.
    Any failure while writing is swallowed on purpose so that debug logging
    can never interrupt the reward computation.
    """
    if not _reward_debug_enabled(kwargs):
        return
    path = _reward_debug_path(kwargs, reward_name)
    if not path:
        return
    limit = _reward_debug_max_rows(kwargs)
    if limit <= 0:
        return
    written = _REWARD_DEBUG_COUNTER.get(path, 0)
    if written >= limit:
        return
    try:
        folder = os.path.dirname(path)
        if folder:
            os.makedirs(folder, exist_ok=True)
        record = {
            "ts": time.time(),
            "reward_name": reward_name,
            **_to_jsonable(row),
        }
        with open(path, "a", encoding="utf-8") as sink:
            sink.write(json.dumps(record, ensure_ascii=False) + "\n")
        # Count only rows that were actually written.
        _REWARD_DEBUG_COUNTER[path] = written + 1
    except Exception:
        pass
|
| 117 |
+
|
| 118 |
+
|
| 119 |
+
def _extract_completion_text(s: str) -> str:
    """Reduce a raw model completion to the bare transcription text.

    Steps, in order:
      1. ``None`` becomes ``""``; non-string values are stringified instead of
         crashing on ``.strip()``.
      2. If an ``<answer>...</answer>`` span exists, only its content is kept.
      3. One leading label (e.g. ``transcription:``) is removed, matched
         case-insensitively.
      4. The ``<|im_end|>`` marker is removed.
      5. ``parse_asr_output`` is tried; a non-empty parsed text replaces the
         string, and any parser failure leaves the string as it was.
    """
    if s is None:
        return ""
    if not isinstance(s, str):
        s = str(s)
    s = s.strip()
    m = _ANSWER_RE.search(s)
    if m:
        s = m.group(1).strip()
    lower = s.lower()
    # The Chinese labels are listed with both the ASCII colon and the
    # full-width colon; the list previously repeated the ASCII form twice.
    prefixes = (
        "transcription:", "asr:", "answer:",
        "答案:", "答案：", "识别结果:", "识别结果：",
    )
    for pfx in prefixes:
        if lower.startswith(pfx):
            s = s[len(pfx):].strip()
            break
    s = s.replace("<|im_end|>", "").strip()
    try:
        _lang, text = parse_asr_output(s, user_language=None)
        if text:
            s = text
    except Exception:
        # Best effort: keep the manually cleaned string if the parser fails.
        pass
    return s
|
| 139 |
+
|
| 140 |
+
|
| 141 |
+
def normalize_text(s: str) -> str:
    """Return ``s`` trimmed and lower-cased; falsy input becomes ``""``."""
    if not s:
        return ""
    return s.strip().lower()
|
| 143 |
+
|
| 144 |
+
|
| 145 |
+
@lru_cache(maxsize=50000)
def _tokenize_cached(s: str) -> Tuple[str, ...]:
    """Tokenize normalized text, memoized on the input string.

    Text containing at least one space character is split on whitespace into
    words; text without a space is split into individual non-whitespace
    characters. Empty text yields an empty tuple.
    """
    text = normalize_text(s)
    if not text:
        return ()
    if " " not in text:
        return tuple(ch for ch in text if not ch.isspace())
    # str.split() with no arguments never produces empty strings.
    return tuple(text.split())
|
| 153 |
+
|
| 154 |
+
|
| 155 |
+
def _tokenize(s: str) -> List[str]:
    """Return the cached tokenization of ``s`` as a fresh list."""
    return [*_tokenize_cached(s)]
|
| 157 |
+
|
| 158 |
+
|
| 159 |
+
def _char_seq(s: str) -> List[str]:
    """Return the non-whitespace characters of the normalized text, in order."""
    return [ch for ch in normalize_text(s) if not ch.isspace()]
|
| 162 |
+
|
| 163 |
+
|
| 164 |
+
def _infer_dirty_type_from_audio(x: Any) -> str:
|
| 165 |
+
if x is None:
|
| 166 |
+
return "other"
|
| 167 |
+
if isinstance(x, (list, tuple)) and len(x) > 0:
|
| 168 |
+
x = x[0]
|
| 169 |
+
s = str(x).lower()
|
| 170 |
+
if "voices" in s:
|
| 171 |
+
return "voices_noise_plus_farfield"
|
| 172 |
+
if "noise+rsp" in s or "resample_noise" in s or ("/noise/" in s and "voices" not in s):
|
| 173 |
+
return "noise_rsp_pure_noise"
|
| 174 |
+
return "other"
|
| 175 |
+
|
| 176 |
+
|
| 177 |
+
def _get_dirty_type(kwargs, i: int) -> str:
    """Resolve the dirty-data category for sample ``i``.

    An explicit ``dirty_type`` is normalized (trimmed, lower-cased) and mapped
    through known aliases; unknown labels are returned as normalized. Without
    an explicit label the category is inferred from ``audio_path`` and, if
    that is missing, from ``audios``.
    """
    explicit = _pick_field(kwargs.get("dirty_type"), i)
    if explicit is not None:
        label = str(explicit).strip().lower()
        if label in {"voices", "voices_noise_plus_farfield", "voices_far", "voices_farfield"}:
            return "voices_noise_plus_farfield"
        if label in {"noise", "noise_rsp", "noise_rsp_pure_noise", "pure_noise"}:
            return "noise_rsp_pure_noise"
        return label

    audio_path = _pick_field(kwargs.get("audio_path"), i)
    source = audio_path if audio_path is not None else _pick_field(kwargs.get("audios"), i)
    return _infer_dirty_type_from_audio(source)
|
| 193 |
+
|
| 194 |
+
|
| 195 |
+
def _edit_ops_counts(ref_toks: List[str], hyp_toks: List[str]) -> Tuple[int, int, int]:
|
| 196 |
+
n, m = len(ref_toks), len(hyp_toks)
|
| 197 |
+
dp = [[0] * (m + 1) for _ in range(n + 1)]
|
| 198 |
+
bt = [[0] * (m + 1) for _ in range(n + 1)]
|
| 199 |
+
|
| 200 |
+
for i in range(1, n + 1):
|
| 201 |
+
dp[i][0] = i
|
| 202 |
+
bt[i][0] = 2
|
| 203 |
+
for j in range(1, m + 1):
|
| 204 |
+
dp[0][j] = j
|
| 205 |
+
bt[0][j] = 3
|
| 206 |
+
|
| 207 |
+
for i in range(1, n + 1):
|
| 208 |
+
ri = ref_toks[i - 1]
|
| 209 |
+
for j in range(1, m + 1):
|
| 210 |
+
hj = hyp_toks[j - 1]
|
| 211 |
+
if ri == hj:
|
| 212 |
+
dp[i][j] = dp[i - 1][j - 1]
|
| 213 |
+
bt[i][j] = 0
|
| 214 |
+
else:
|
| 215 |
+
sub = dp[i - 1][j - 1] + 1
|
| 216 |
+
dele = dp[i - 1][j] + 1
|
| 217 |
+
ins = dp[i][j - 1] + 1
|
| 218 |
+
best = min(sub, dele, ins)
|
| 219 |
+
dp[i][j] = best
|
| 220 |
+
if best == sub:
|
| 221 |
+
bt[i][j] = 1
|
| 222 |
+
elif best == dele:
|
| 223 |
+
bt[i][j] = 2
|
| 224 |
+
else:
|
| 225 |
+
bt[i][j] = 3
|
| 226 |
+
|
| 227 |
+
i, j = n, m
|
| 228 |
+
sub = dele = ins = 0
|
| 229 |
+
while i > 0 or j > 0:
|
| 230 |
+
op = bt[i][j]
|
| 231 |
+
if i > 0 and j > 0 and op == 0:
|
| 232 |
+
i -= 1
|
| 233 |
+
j -= 1
|
| 234 |
+
elif i > 0 and j > 0 and op == 1:
|
| 235 |
+
sub += 1
|
| 236 |
+
i -= 1
|
| 237 |
+
j -= 1
|
| 238 |
+
elif i > 0 and op == 2:
|
| 239 |
+
dele += 1
|
| 240 |
+
i -= 1
|
| 241 |
+
else:
|
| 242 |
+
ins += 1
|
| 243 |
+
j -= 1
|
| 244 |
+
return sub, dele, ins
|
| 245 |
+
|
| 246 |
+
|
| 247 |
+
def _char_bigram_f1(hyp: str, ref: str) -> float:
    """F1 overlap of character bigrams between hypothesis and reference.

    Both empty gives 1.0, exactly one empty gives 0.0. When either side has
    fewer than two characters, position-wise character matches are used in
    place of bigrams.
    """
    hyp_chars = _char_seq(hyp)
    ref_chars = _char_seq(ref)
    if not hyp_chars and not ref_chars:
        return 1.0
    if not hyp_chars or not ref_chars:
        return 0.0

    if len(hyp_chars) < 2 or len(ref_chars) < 2:
        # Too short for bigrams: compare aligned positions instead.
        overlap = sum(1 for a, b in zip(hyp_chars, ref_chars) if a == b)
        precision = overlap / max(1, len(hyp_chars))
        recall = overlap / max(1, len(ref_chars))
    else:
        hyp_grams = Counter(zip(hyp_chars, hyp_chars[1:]))
        ref_grams = Counter(zip(ref_chars, ref_chars[1:]))
        overlap = sum(min(count, ref_grams[gram]) for gram, count in hyp_grams.items())
        precision = overlap / max(1, sum(hyp_grams.values()))
        recall = overlap / max(1, sum(ref_grams.values()))
    # The epsilon floor avoids a zero division when there is no overlap.
    return 2.0 * precision * recall / max(1e-8, precision + recall)
|
| 266 |
+
|
| 267 |
+
|
| 268 |
+
def _lcs_lengths(hyp: str, ref: str) -> Tuple[int, int, int]:
    """Compute the character-level longest common subsequence length.

    Uses a rolling two-row dynamic programme over the non-whitespace
    characters of both strings.

    Returns:
        ``(lcs_length, ref_char_count, hyp_char_count)``.
    """
    hyp_chars = _char_seq(hyp)
    ref_chars = _char_seq(ref)
    ref_n, hyp_n = len(ref_chars), len(hyp_chars)
    if ref_n == 0 or hyp_n == 0:
        return 0, ref_n, hyp_n

    above = [0] * (hyp_n + 1)
    for ref_ch in ref_chars:
        row = [0]
        for col, hyp_ch in enumerate(hyp_chars, start=1):
            if ref_ch == hyp_ch:
                row.append(above[col - 1] + 1)
            else:
                row.append(max(above[col], row[col - 1]))
        above = row
    return above[hyp_n], ref_n, hyp_n
|
| 285 |
+
|
| 286 |
+
|
| 287 |
+
def _lcs_f1(hyp: str, ref: str) -> float:
    """F1 score derived from the character-level LCS length.

    Both sides empty gives 1.0; exactly one side empty gives 0.0.
    """
    common, ref_n, hyp_n = _lcs_lengths(hyp, ref)
    if ref_n == 0 and hyp_n == 0:
        return 1.0
    if ref_n == 0 or hyp_n == 0:
        return 0.0
    precision = common / max(1, hyp_n)
    recall = common / max(1, ref_n)
    return 2.0 * precision * recall / max(1e-8, precision + recall)
|
| 296 |
+
|
| 297 |
+
|
| 298 |
+
def _cmp_score(hyp: str, ref: str) -> float:
    """Blend bigram F1 (weight 0.70) and LCS F1 (weight 0.30) into one score."""
    bigram_part = 0.70 * _char_bigram_f1(hyp, ref)
    lcs_part = 0.30 * _lcs_f1(hyp, ref)
    return bigram_part + lcs_part
|
| 300 |
+
|
| 301 |
+
|
| 302 |
+
def wer_reward_main(wer: float) -> float:
    """Map a WER value to the main reward via a piecewise-linear curve.

    The reward starts at 1.0 for ``wer == 0`` and decreases through the
    breakpoints 0.15, 0.35, 0.70 and 1.20, after which it is flat at -0.92.
    """
    if wer <= 0.15:
        return 1.0 - 1.8 * wer
    if wer <= 0.35:
        return 0.73 - 2.3 * (wer - 0.15)
    if wer <= 0.70:
        return 0.27 - 2.4 * (wer - 0.35)
    if wer <= 1.20:
        return -0.57 - 0.70 * (wer - 0.70)
    return -0.92
|
| 313 |
+
|
| 314 |
+
|
| 315 |
+
def length_ratio_penalty_v3(
    hyp_len: int,
    ref_len: int,
    soft_min: float = 0.90,
    soft_max: float = 1.10,
    hard_min: float = 0.78,
    hard_max: float = 1.30,
    soft_penalty: float = 0.10,
    hard_penalty: float = 0.36,
) -> float:
    """Penalize hypotheses whose length deviates from the reference length.

    The ratio ``hyp_len / max(1, ref_len)`` is free inside
    ``[soft_min, soft_max]``, ramps linearly to ``-soft_penalty`` at the hard
    bounds, and ramps further towards ``-hard_penalty`` beyond them.

    Returns:
        A value in ``[-hard_penalty, 0.0]`` for the default parameters.
    """
    ratio = hyp_len / max(1, ref_len)

    if soft_min <= ratio <= soft_max:
        return 0.0
    if hard_min <= ratio < soft_min:
        return -soft_penalty * ((soft_min - ratio) / max(1e-6, soft_min - hard_min))
    if soft_max < ratio <= hard_max:
        return -soft_penalty * ((ratio - soft_max) / max(1e-6, hard_max - soft_max))

    # Outside the hard band: measure the overshoot relative to the bound.
    if ratio < hard_min:
        overshoot = (hard_min - ratio) / max(1e-6, hard_min)
    else:
        overshoot = (ratio - hard_max) / max(1e-6, hard_max)
    frac = min(1.0, overshoot)
    return -(soft_penalty + (hard_penalty - soft_penalty) * frac)
|
| 340 |
+
|
| 341 |
+
|
| 342 |
+
def tail_penalty(len_ratio: float) -> float:
    """Penalize over-long hypotheses with a piecewise-linear curve.

    No penalty up to a ratio of 1.15, a linear ramp down to -0.28 at 1.40,
    a second ramp down to -0.70 at 2.0, and a flat -0.70 beyond that.
    """
    if len_ratio > 2.0:
        return -0.70
    if len_ratio > 1.40:
        return -0.28 - 0.42 * (len_ratio - 1.40) / 0.60
    if len_ratio > 1.15:
        return -0.28 * (len_ratio - 1.15) / 0.25
    return 0.0
|
| 350 |
+
|
| 351 |
+
|
| 352 |
+
def is_hallucination_v56(hyp_toks: List[str], ref_toks: List[str], wer: float, len_ratio: float):
    """Flag degenerate hypotheses and report which rule fired.

    Rules are checked in this order: empty hypothesis, a run of five or more
    identical consecutive tokens, one bigram making up more than 22% of all
    bigrams (only for hypotheses of eight or more tokens), length ratio above
    1.60, and WER of at least 1.20. ``ref_toks`` is accepted but not read.

    Returns:
        ``(is_hallucination, reason)``; ``reason`` is ``"ok"`` when no rule
        fires.
    """
    token_count = len(hyp_toks)
    if token_count == 0:
        return True, "empty"

    streak = 1
    for prev_tok, tok in zip(hyp_toks, hyp_toks[1:]):
        streak = streak + 1 if tok == prev_tok else 1
        if streak >= 5:
            return True, "repeat_run>=5"

    if token_count >= 8:
        pairs = list(zip(hyp_toks, hyp_toks[1:]))
        top_count = max(Counter(pairs).values())
        if top_count / max(1, len(pairs)) > 0.22:
            return True, "repeat_bigram>0.22"

    if len_ratio > 1.60:
        return True, "len_ratio>1.60"
    if wer >= 1.20:
        return True, "wer>=1.20"
    return False, "ok"
|
| 376 |
+
|
| 377 |
+
|
| 378 |
+
def _voices_residual(del_rate: float, len_ratio: float):
|
| 379 |
+
p_del_voice = -0.12 * del_rate - 0.08 * max(0.0, del_rate - 0.10)
|
| 380 |
+
p_under_voice = -0.06 * max(0.0, 0.98 - len_ratio)
|
| 381 |
+
return p_del_voice, p_under_voice
|
| 382 |
+
|
| 383 |
+
|
| 384 |
+
def _noise_residual(sub_rate: float, cmp_score: float):
|
| 385 |
+
p_sub_noise = -0.08 * sub_rate
|
| 386 |
+
p_cmp_noise = -0.04 * (1.0 - cmp_score)
|
| 387 |
+
return p_sub_noise, p_cmp_noise
|
| 388 |
+
|
| 389 |
+
|
| 390 |
+
class ASRWerSubLenCmpHalluDirtyV56(ORM):
    """ASR reward combining WER, substitution, length, similarity and hallucination terms.

    For each completion the reward is the sum of a piecewise WER reward and a
    set of non-positive penalties (substitution rate, length ratio, tail
    length, text dissimilarity, hallucination, empty output), plus residual
    penalties that depend on the resolved dirty-data category. The sum is
    clipped to ``[reward_clip_min, reward_clip_max]``.
    """

    # Weights of the substitution penalty: linear term, and extra slope once
    # the substitution rate exceeds 0.35.
    sub_penalty_a = 0.40
    sub_penalty_b = 0.35
    # Weight applied to (1 - cmp_score).
    cmp_penalty = 0.14
    # Flat penalties for flagged hallucinations and for empty hypotheses.
    hallu_extra_penalty = 0.42
    empty_extra_penalty = 0.28

    # Bounds applied to the summed reward.
    reward_clip_min = -4.0
    reward_clip_max = 2.0

    def __call__(self, completions, solution=None, **kwargs):
        """Score every completion against its reference transcription.

        Args:
            completions: Raw model outputs, one per sample.
            solution: A single reference string shared by all completions, or
                a sequence of per-sample references.
            **kwargs: Optional per-sample metadata (``dirty_type``,
                ``audio_path``, ``audios``, ...) and debug switches.

        Returns:
            A list with exactly one float per completion. When no solution is
            given at all, or a completion has no matching reference, that
            completion receives a neutral ``0.0``.
        """
        if solution is None:
            solution = kwargs.get("solution")
        if solution is None:
            return [0.0 for _ in completions]

        if isinstance(solution, str):
            solution_list = [solution for _ in completions]
        else:
            solution_list = list(solution)

        rewards = []
        # Iterate over completions (not zip) so a short reference list can
        # never shorten the returned reward list.
        for i, comp in enumerate(completions):
            if i >= len(solution_list):
                # No reference available: stay neutral, mirroring the
                # behaviour used when no solution is supplied at all.
                rewards.append(0.0)
                continue

            hyp = _extract_completion_text(comp)
            ref = solution_list[i] or ""

            ref_toks = _tokenize(ref)
            hyp_toks = _tokenize(hyp)

            # Floor the reference length at 1 to keep the ratios finite.
            ref_len = max(1, len(ref_toks))
            hyp_len = len(hyp_toks)
            len_ratio = float(hyp_len) / float(ref_len)

            sub_cnt, del_cnt, ins_cnt = _edit_ops_counts(ref_toks, hyp_toks)
            wer = float(sub_cnt + del_cnt + ins_cnt) / float(ref_len)

            sub_rate = float(sub_cnt) / float(ref_len)
            del_rate = float(del_cnt) / float(ref_len)

            r_wer = wer_reward_main(wer)
            p_sub = -float(self.sub_penalty_a) * sub_rate - float(self.sub_penalty_b) * max(0.0, sub_rate - 0.35)
            p_len = length_ratio_penalty_v3(hyp_len=hyp_len, ref_len=ref_len)
            p_tail = tail_penalty(len_ratio)

            cmp_score = _cmp_score(hyp, ref)
            p_cmp = -float(self.cmp_penalty) * (1.0 - cmp_score)

            hallu, hallu_reason = is_hallucination_v56(hyp_toks, ref_toks, wer, len_ratio)
            p_hallu = -float(self.hallu_extra_penalty) if hallu else 0.0
            p_empty = -float(self.empty_extra_penalty) if hyp_len == 0 else 0.0

            dirty_type = _get_dirty_type(kwargs, i)
            p_del_voice = 0.0
            p_under_voice = 0.0
            p_sub_noise = 0.0
            p_cmp_noise = 0.0

            # Category-specific residual penalties; other categories get none.
            if dirty_type == "voices_noise_plus_farfield":
                p_del_voice, p_under_voice = _voices_residual(del_rate, len_ratio)
            elif dirty_type == "noise_rsp_pure_noise":
                p_sub_noise, p_cmp_noise = _noise_residual(sub_rate, cmp_score)

            reward_raw = float(
                r_wer + p_sub + p_len + p_tail + p_cmp + p_hallu + p_empty
                + p_del_voice + p_under_voice + p_sub_noise + p_cmp_noise
            )
            r = max(float(self.reward_clip_min), min(float(self.reward_clip_max), reward_raw))
            rewards.append(r)

            _append_reward_debug_row(
                reward_name="asr_wer_sub_len_cmp_hallu_dirty_v56",
                kwargs=kwargs,
                row={
                    **_collect_common_debug_meta(kwargs, i),
                    "index": i,
                    "dirty_type_resolved": dirty_type,
                    "completion_raw": comp,
                    "hyp": hyp,
                    "ref": ref,
                    "ref_len": ref_len,
                    "hyp_len": hyp_len,
                    "len_ratio": len_ratio,
                    "sub_cnt": sub_cnt,
                    "del_cnt": del_cnt,
                    "ins_cnt": ins_cnt,
                    "wer_calc": wer,
                    "sub_rate": sub_rate,
                    "del_rate": del_rate,
                    "cmp_score": cmp_score,
                    "hallu": hallu,
                    "hallu_reason": hallu_reason,
                    "r_wer": r_wer,
                    "p_sub": p_sub,
                    "p_len": p_len,
                    "p_tail": p_tail,
                    "p_cmp": p_cmp,
                    "p_hallu": p_hallu,
                    "p_empty": p_empty,
                    "p_del_voice": p_del_voice,
                    "p_under_voice": p_under_voice,
                    "p_sub_noise": p_sub_noise,
                    "p_cmp_noise": p_cmp_noise,
                    "reward_raw": reward_raw,
                    "reward": r,
                },
            )

        return rewards
|
| 498 |
+
|
| 499 |
+
|
| 500 |
+
orms["asr_wer_sub_len_cmp_hallu_dirty_v56"] = ASRWerSubLenCmpHalluDirtyV56
|
0417train.sh
ADDED
|
@@ -0,0 +1,75 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
|
| 2 |
+
# Launch script for GRPO/DAPO training of the Qwen3-ASR model with ms-swift.
# Requires WANDB_API_KEY to be exported by the caller before running.

BASE_DIR="/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin"
UPLOAD_DIR="${BASE_DIR}/0416upload"

TRAIN_DATA="${UPLOAD_DIR}/lora_0323_10w+55w+error+syn_with_domain_train90_targeted_rl_train90_loramerged_basewer_3suppress_server.jsonl"
VAL_DATA="${UPLOAD_DIR}/lora_0323_10w+55w+error+syn_with_domain_train90_targeted_rl_val5_sample5p_server.jsonl"  # newly added validation set

# Run name and output directory are defined once and reused below.
RUN_NAME="qwen3asr_dapo_reward56_4x4x12_12gen_4GPU"
OUTPUT_DIR="${UPLOAD_DIR}/out/${RUN_NAME}"

export MASTER_PORT=29540
export MASTER_ADDR=127.0.0.1

######################
# 0. Base environment variables (wandb)
######################
export WANDB_BASE_URL="https://api.wandb.ai"
# SECURITY: the API key must come from the environment and must never be
# committed. A key was previously hard-coded on this line and published with
# the repository; treat it as compromised and revoke it.
export WANDB_API_KEY="${WANDB_API_KEY:?WANDB_API_KEY must be set in the environment}"
export WANDB_PROJECT="qwen3_asr_swift_dapo"   # project name as shown in the screenshot
export WANDB_ENTITY="pang_kaiyu-none"         # entity as shown in the screenshot

# Original note: have wandb use a single process for logging during multi-GPU
# training (optional). NOTE(review): confirm that WANDB_MODE=online is the
# setting intended for that purpose.
export WANDB_MODE=online
export NPROC_PER_NODE=4
export SWIFT_SINGLE_DEVICE_MODE=1
export PYTORCH_CUDA_ALLOC_CONF=expandable_segments:True

# Reward debug logging, read by 0417_reward.py.
export ASR_REWARD_DEBUG=1
export ASR_REWARD_DEBUG_PATH="${OUTPUT_DIR}/reward_debug"
export ASR_REWARD_DEBUG_MAX_ROWS=1000

swift rlhf \
  --rlhf_type grpo \
  --external_plugins "${UPLOAD_DIR}/my_qwen3_asr_dapo_register.py" "${UPLOAD_DIR}/0417_reward.py" \
  --model "${BASE_DIR}/qwen3-asr-merged" \
  --model_type my_qwen3_asr_rl \
  --template my_qwen3_asr_rl \
  --dataset "${TRAIN_DATA}" \
  --val_dataset "${VAL_DATA}" \
  --reward_funcs asr_wer_sub_len_cmp_hallu_dirty_v56 \
  --train_type lora \
  --use_vllm false \
  --log_completions true \
  --loss_type dapo \
  --advantage_estimator grpo \
  --scale_rewards group \
  --num_iterations 2 \
  --beta 0.04 \
  --epsilon_high 0.28 \
  --dynamic_sample true \
  --max_resample_times 4 \
  --overlong_filter true \
  --truncation_strategy delete \
  --num_generations 12 \
  --generation_batch_size 48 \
  --per_device_train_batch_size 4 \
  --per_device_eval_batch_size 4 \
  --gradient_accumulation_steps 12 \
  --num_generations_eval 4 \
  --max_completion_length 256 \
  --temperature 0.50 \
  --top_p 0.95 \
  --top_k 50 \
  --repetition_penalty 1.08 \
  --learning_rate 5e-5 \
  --lr_scheduler_type cosine \
  --warmup_ratio 0.03 \
  --report_to wandb \
  --run_name "${RUN_NAME}" \
  --output_dir "${OUTPUT_DIR}" \
  --save_strategy steps \
  --save_steps 20 \
  --logging_steps 5 \
  --freeze_llm false \
  --freeze_vit false \
  --freeze_aligner false \
  --remove_unused_columns false \
  --padding_side left
|
wandb/debug-internal.log
ADDED
|
@@ -0,0 +1,72 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{"time":"2026-04-18T17:28:47.877484976+08:00","level":"INFO","msg":"stream: starting","core version":"0.23.0"}
|
| 2 |
+
{"time":"2026-04-18T17:28:48.347618035+08:00","level":"INFO","msg":"stream: created new stream","id":"c2a5hfz3"}
|
| 3 |
+
{"time":"2026-04-18T17:28:48.347701352+08:00","level":"INFO","msg":"handler: started","stream_id":"c2a5hfz3"}
|
| 4 |
+
{"time":"2026-04-18T17:28:48.350844585+08:00","level":"INFO","msg":"stream: started","id":"c2a5hfz3"}
|
| 5 |
+
{"time":"2026-04-18T17:28:48.350849894+08:00","level":"INFO","msg":"writer: started","stream_id":"c2a5hfz3"}
|
| 6 |
+
{"time":"2026-04-18T17:28:48.350854798+08:00","level":"INFO","msg":"sender: started","stream_id":"c2a5hfz3"}
|
| 7 |
+
{"time":"2026-04-18T17:37:33.858258418+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 8 |
+
{"time":"2026-04-19T02:34:07.470718868+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 9 |
+
{"time":"2026-04-19T02:38:39.32386773+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": http2: client conn could not be established"}
|
| 10 |
+
{"time":"2026-04-19T02:40:17.658933776+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 11 |
+
{"time":"2026-04-19T02:43:03.564180775+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 12 |
+
{"time":"2026-04-19T02:44:49.518795314+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 13 |
+
{"time":"2026-04-19T02:45:08.529740538+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 14 |
+
{"time":"2026-04-19T02:46:20.848321936+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 15 |
+
{"time":"2026-04-19T02:49:05.639172159+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 16 |
+
{"time":"2026-04-19T15:09:49.426045163+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 17 |
+
{"time":"2026-04-19T15:57:04.347389276+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 18 |
+
{"time":"2026-04-19T16:02:30.488210102+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 19 |
+
{"time":"2026-04-19T22:07:33.03303113+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 20 |
+
{"time":"2026-04-19T22:07:51.98901393+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 21 |
+
{"time":"2026-04-19T22:08:16.035247515+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 22 |
+
{"time":"2026-04-19T22:09:42.186767689+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 23 |
+
{"time":"2026-04-19T22:24:00.480169619+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 24 |
+
{"time":"2026-04-19T22:24:34.690158146+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 25 |
+
{"time":"2026-04-19T22:28:36.622066809+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 26 |
+
{"time":"2026-04-19T22:28:59.75540152+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 27 |
+
{"time":"2026-04-19T22:31:22.975036457+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 28 |
+
{"time":"2026-04-19T22:34:17.890202383+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 29 |
+
{"time":"2026-04-19T22:43:21.155119859+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 30 |
+
{"time":"2026-04-19T22:43:38.33530735+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 31 |
+
{"time":"2026-04-19T22:46:03.44895843+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 32 |
+
{"time":"2026-04-19T22:48:50.248056745+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 33 |
+
{"time":"2026-04-19T22:49:48.447601198+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 34 |
+
{"time":"2026-04-19T22:52:35.56119014+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 35 |
+
{"time":"2026-04-19T22:52:50.371922946+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 36 |
+
{"time":"2026-04-19T22:56:30.747794336+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 37 |
+
{"time":"2026-04-19T22:58:32.547706574+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 38 |
+
{"time":"2026-04-19T23:00:23.617563694+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 39 |
+
{"time":"2026-04-19T23:00:37.717734501+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 40 |
+
{"time":"2026-04-19T23:05:31.94573349+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 41 |
+
{"time":"2026-04-19T23:05:44.893259249+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 42 |
+
{"time":"2026-04-20T00:03:04.382543732+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 43 |
+
{"time":"2026-04-20T00:03:19.501053157+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 44 |
+
{"time":"2026-04-20T00:05:31.556601347+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 45 |
+
{"time":"2026-04-20T00:06:03.495128433+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 46 |
+
{"time":"2026-04-20T00:11:23.73287074+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 47 |
+
{"time":"2026-04-20T02:58:43.522847172+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": net/http: request canceled (Client.Timeout exceeded while awaiting headers)"}
|
| 48 |
+
{"time":"2026-04-20T02:59:04.598457045+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": context deadline exceeded"}
|
| 49 |
+
{"time":"2026-04-20T02:59:15.733502761+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": context deadline exceeded (Client.Timeout exceeded while awaiting headers)"}
|
| 50 |
+
{"time":"2026-04-20T02:59:49.917399553+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": context deadline exceeded (Client.Timeout exceeded while awaiting headers)"}
|
| 51 |
+
{"time":"2026-04-20T03:00:07.058218433+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": context deadline exceeded"}
|
| 52 |
+
{"time":"2026-04-20T03:00:29.606621937+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": net/http: request canceled (Client.Timeout exceeded while awaiting headers)"}
|
| 53 |
+
{"time":"2026-04-20T03:00:34.624296643+08:00","level":"INFO","msg":"flowcontrol: backed up, offloading to disk","recordNumber":124381}
|
| 54 |
+
{"time":"2026-04-20T03:00:46.264621657+08:00","level":"INFO","msg":"flowcontrol: unblocked","totalOffloaded":1}
|
| 55 |
+
{"time":"2026-04-20T03:44:43.734398398+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": context deadline exceeded (Client.Timeout exceeded while awaiting headers)"}
|
| 56 |
+
{"time":"2026-04-20T04:11:48.762158534+08:00","level":"INFO","msg":"api: retrying HTTP error","status":503,"url":"https://api.wandb.ai/graphql","body":"upstream connect error or disconnect/reset before headers. reset reason: connection termination"}
|
| 57 |
+
{"time":"2026-04-20T04:13:58.74920069+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": net/http: request canceled (Client.Timeout exceeded while awaiting headers)"}
|
| 58 |
+
{"time":"2026-04-20T06:34:34.21211755+08:00","level":"INFO","msg":"api: retrying HTTP error","status":503,"url":"https://api.wandb.ai/graphql","body":"upstream connect error or disconnect/reset before headers. reset reason: connection termination"}
|
| 59 |
+
{"time":"2026-04-20T10:50:53.628901466+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 60 |
+
{"time":"2026-04-20T16:00:42.158363018+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 61 |
+
{"time":"2026-04-20T16:02:08.101875007+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 62 |
+
{"time":"2026-04-20T16:03:45.141714956+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 63 |
+
{"time":"2026-04-20T16:04:52.17332644+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 64 |
+
{"time":"2026-04-20T16:05:06.320377956+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 65 |
+
{"time":"2026-04-20T16:05:29.800728083+08:00","level":"ERROR","msg":"sender: sendStopStatus: failed to get run stopped status: context deadline exceeded (Client.Timeout or context cancellation while reading body)"}
|
| 66 |
+
{"time":"2026-04-20T16:05:30.799799131+08:00","level":"INFO","msg":"stream: closing","id":"c2a5hfz3"}
|
| 67 |
+
{"time":"2026-04-20T16:05:39.191906442+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 68 |
+
{"time":"2026-04-20T16:05:43.710909983+08:00","level":"INFO","msg":"fileTransfer: Close: file transfer manager closed"}
|
| 69 |
+
{"time":"2026-04-20T16:06:10.469686843+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 70 |
+
{"time":"2026-04-20T16:06:17.397266507+08:00","level":"INFO","msg":"handler: closed","stream_id":"c2a5hfz3"}
|
| 71 |
+
{"time":"2026-04-20T16:06:17.400263519+08:00","level":"INFO","msg":"sender: closed","stream_id":"c2a5hfz3"}
|
| 72 |
+
{"time":"2026-04-20T16:06:17.40028542+08:00","level":"INFO","msg":"stream: closed","id":"c2a5hfz3"}
|
wandb/debug.log
ADDED
|
@@ -0,0 +1,26 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
2026-04-18 17:28:47,491 INFO MainThread:10295 [wandb_setup.py:_flush():80] Current SDK version is 0.23.0
|
| 2 |
+
2026-04-18 17:28:47,491 INFO MainThread:10295 [wandb_setup.py:_flush():80] Configure stats pid to 10295
|
| 3 |
+
2026-04-18 17:28:47,491 INFO MainThread:10295 [wandb_setup.py:_flush():80] Loading settings from /mnt/petrelfs/panjiabao/.config/wandb/settings
|
| 4 |
+
2026-04-18 17:28:47,491 INFO MainThread:10295 [wandb_setup.py:_flush():80] Loading settings from /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/wandb/settings
|
| 5 |
+
2026-04-18 17:28:47,491 INFO MainThread:10295 [wandb_setup.py:_flush():80] Loading settings from environment variables
|
| 6 |
+
2026-04-18 17:28:47,491 INFO MainThread:10295 [wandb_init.py:setup_run_log_directory():713] Logging user logs to /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/wandb/run-20260418_172847-c2a5hfz3/logs/debug.log
|
| 7 |
+
2026-04-18 17:28:47,491 INFO MainThread:10295 [wandb_init.py:setup_run_log_directory():714] Logging internal logs to /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/wandb/run-20260418_172847-c2a5hfz3/logs/debug-internal.log
|
| 8 |
+
2026-04-18 17:28:47,491 INFO MainThread:10295 [wandb_init.py:init():840] calling init triggers
|
| 9 |
+
2026-04-18 17:28:47,491 INFO MainThread:10295 [wandb_init.py:init():845] wandb.init called with sweep_config: {}
|
| 10 |
+
config: {'_wandb': {}}
|
| 11 |
+
2026-04-18 17:28:47,491 INFO MainThread:10295 [wandb_init.py:init():888] starting backend
|
| 12 |
+
2026-04-18 17:28:47,865 INFO MainThread:10295 [wandb_init.py:init():891] sending inform_init request
|
| 13 |
+
2026-04-18 17:28:47,870 INFO MainThread:10295 [wandb_init.py:init():899] backend started and connected
|
| 14 |
+
2026-04-18 17:28:47,874 INFO MainThread:10295 [wandb_init.py:init():969] updated telemetry
|
| 15 |
+
2026-04-18 17:28:47,875 INFO MainThread:10295 [wandb_init.py:init():993] communicating run to backend with 90.0 second timeout
|
| 16 |
+
2026-04-18 17:28:49,589 INFO MainThread:10295 [wandb_init.py:init():1040] starting run threads in backend
|
| 17 |
+
2026-04-18 17:28:50,217 INFO MainThread:10295 [wandb_run.py:_console_start():2504] atexit reg
|
| 18 |
+
2026-04-18 17:28:50,218 INFO MainThread:10295 [wandb_run.py:_redirect():2352] redirect: wrap_raw
|
| 19 |
+
2026-04-18 17:28:50,218 INFO MainThread:10295 [wandb_run.py:_redirect():2421] Wrapping output streams.
|
| 20 |
+
2026-04-18 17:28:50,218 INFO MainThread:10295 [wandb_run.py:_redirect():2444] Redirects installed.
|
| 21 |
+
2026-04-18 17:28:50,224 INFO MainThread:10295 [wandb_init.py:init():1080] run started, returning control to user process
|
| 22 |
+
2026-04-18 17:28:50,229 INFO MainThread:10295 [wandb_run.py:_config_callback():1385] config_cb None None {'peft_config': {'default': {'task_type': 'CAUSAL_LM', 'peft_type': 'LORA', 'auto_mapping': None, 'peft_version': '0.18.1', 'base_model_name_or_path': '/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/qwen3-asr-merged', 'revision': None, 'inference_mode': False, 'r': 8, 'target_modules': '^(thinker\\.model(?=\\.).*\\.(up_proj|q_proj|o_proj|gate_proj|k_proj|v_proj|down_proj)|thinker\\.audio_tower\\.layers(?=\\.).*\\.(q_proj|fc1|out_proj|k_proj|v_proj|fc2)|thinker\\.audio_tower\\.conv_out(?=\\.)|thinker\\.audio_tower\\.proj1(?=\\.)|thinker\\.audio_tower\\.proj2(?=\\.))$', 'exclude_modules': None, 'lora_alpha': 32, 'lora_dropout': 0.05, 'fan_in_fan_out': False, 'bias': 'none', 'use_rslora': False, 'modules_to_save': [], 'init_lora_weights': True, 'layers_to_transform': None, 'layers_pattern': None, 'rank_pattern': {}, 'alpha_pattern': {}, 'megatron_config': None, 'megatron_core': 'megatron.core', 'trainable_token_indices': None, 'loftq_config': {}, 'eva_config': None, 'corda_config': None, 'use_dora': False, 'alora_invocation_tokens': None, 'use_qalora': False, 'qalora_group_size': 16, 'layer_replication': None, 'runtime_config': {'ephemeral_gpu_offload': False}, 'lora_bias': False, 'target_parameters': None, 'arrow_config': None, 'ensure_weight_tying': False, 'lora_dtype': None, 'lorap_lr_ratio': None, 'lorap_emb_lr': 1e-06}}, 'return_dict': True, 'output_hidden_states': False, 'torchscript': False, 'dtype': 'bfloat16', 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'architectures': ['Qwen3ASRForConditionalGeneration'], 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'task_specific_params': None, 'problem_type': None, 
'tokenizer_class': None, 'prefix': None, 'bos_token_id': None, 'pad_token_id': 151643, 'eos_token_id': 151645, 'sep_token_id': None, 'decoder_start_token_id': None, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'temperature': 0.5, 'top_k': 50, 'top_p': 0.95, 'typical_p': 1.0, 'repetition_penalty': 1.08, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'num_beam_groups': 1, 'diversity_penalty': 0.0, '_name_or_path': '/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/qwen3-asr-merged', 'transformers_version': '4.57.6', 'model_type': 'qwen3_asr', 'tf_legacy_loss': False, 'use_bfloat16': False, 'thinker_config': {'return_dict': True, 'output_hidden_states': False, 'torchscript': False, 'dtype': 'bfloat16', 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'architectures': ['Qwen3ASRForConditionalGeneration'], 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'task_specific_params': None, 'problem_type': None, 'tokenizer_class': None, 'prefix': None, 'bos_token_id': None, 'pad_token_id': None, 'eos_token_id': None, 'sep_token_id': None, 'decoder_start_token_id': None, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'typical_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 
'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'num_beam_groups': 1, 'diversity_penalty': 0.0, '_name_or_path': '', 'audio_end_token_id': 151670, 'model_type': 'qwen3_asr_thinker', 'tf_legacy_loss': False, 'use_bfloat16': False, 'user_token_id': 872, 'audio_start_token_id': 151669, 'initializer_range': 0.02, 'audio_config': {'return_dict': True, 'output_hidden_states': False, 'torchscript': False, 'dtype': None, 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'architectures': None, 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'task_specific_params': None, 'problem_type': None, 'tokenizer_class': None, 'prefix': None, 'bos_token_id': None, 'pad_token_id': None, 'eos_token_id': None, 'sep_token_id': None, 'decoder_start_token_id': None, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'typical_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'num_beam_groups': 1, 'diversity_penalty': 0.0, '_name_or_path': '', 'model_type': 'qwen3_asr_audio_encoder', 'num_hidden_layers': 24, 'tf_legacy_loss': False, 'use_bfloat16': False, 'num_mel_bins': 128, 'd_model': 
1024, 'encoder_layers': 24, 'encoder_attention_heads': 16, 'encoder_ffn_dim': 4096, 'dropout': 0, 'attention_dropout': 0, 'activation_function': 'gelu', 'activation_dropout': 0, 'initializer_range': 0.02, 'scale_embedding': False, 'max_source_positions': 1500, 'n_window': 50, 'output_dim': 2048, 'n_window_infer': 800, 'conv_chunksize': 500, 'downsample_hidden_size': 480, 'output_attentions': False}, 'text_config': {'vocab_size': 151936, 'max_position_embeddings': 65536, 'hidden_size': 2048, 'intermediate_size': 6144, 'num_hidden_layers': 28, 'num_attention_heads': 16, 'num_key_value_heads': 8, 'head_dim': 128, 'hidden_act': 'silu', 'initializer_range': 0.02, 'rms_norm_eps': 1e-06, 'use_cache': False, 'rope_theta': 1000000, 'rope_scaling': {'interleaved': True, 'mrope_interleaved': True, 'mrope_section': [24, 20, 20], 'rope_type': 'default', 'type': 'default'}, 'attention_bias': False, 'attention_dropout': 0.0, 'return_dict': True, 'output_hidden_states': False, 'torchscript': False, 'dtype': None, 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'architectures': None, 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'task_specific_params': None, 'problem_type': None, 'tokenizer_class': None, 'prefix': None, 'bos_token_id': None, 'pad_token_id': 151643, 'eos_token_id': None, 'sep_token_id': None, 'decoder_start_token_id': None, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'typical_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 
'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'num_beam_groups': 1, 'diversity_penalty': 0.0, '_name_or_path': '', 'model_type': 'qwen3_asr_text', 'tf_legacy_loss': False, 'use_bfloat16': False, 'output_attentions': False}, 'audio_token_id': 151676, 'output_attentions': False}, 'support_languages': ['Chinese', 'English', 'Cantonese', 'Arabic', 'German', 'French', 'Spanish', 'Portuguese', 'Indonesian', 'Italian', 'Korean', 'Russian', 'Thai', 'Vietnamese', 'Japanese', 'Turkish', 'Hindi', 'Malay', 'Dutch', 'Swedish', 'Danish', 'Finnish', 'Polish', 'Czech', 'Filipino', 'Persian', 'Greek', 'Romanian', 'Hungarian', 'Macedonian'], 'output_attentions': False, 'output_dir': '/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/out/qwen3asr_dapo_reward56_4x4x12_12gen_4GPU/v5-20260418-172837', 'overwrite_output_dir': False, 'do_train': False, 'do_eval': True, 'do_predict': False, 'eval_strategy': 'steps', 'prediction_loss_only': False, 'per_device_train_batch_size': 4, 'per_device_eval_batch_size': 4, 'per_gpu_train_batch_size': None, 'per_gpu_eval_batch_size': None, 'gradient_accumulation_steps': 12, 'eval_accumulation_steps': None, 'eval_delay': 0, 'torch_empty_cache_steps': None, 'learning_rate': 5e-05, 'weight_decay': 0.1, 'adam_beta1': 0.9, 'adam_beta2': 0.95, 'adam_epsilon': 1e-08, 'max_grad_norm': 1.0, 'num_train_epochs': 3.0, 'max_steps': -1, 'lr_scheduler_type': 'cosine', 'lr_scheduler_kwargs': None, 'warmup_ratio': 0.03, 'warmup_steps': 0, 'log_level': 'passive', 'log_level_replica': 'warning', 'log_on_each_node': True, 'logging_dir': '/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/out/qwen3asr_dapo_reward56_4x4x12_12gen_4GPU/v5-20260418-172837/runs', 'logging_strategy': 'steps', 'logging_first_step': True, 'logging_steps': 5, 'logging_nan_inf_filter': True, 'save_strategy': 'steps', 'save_steps': 20, 'save_total_limit': 
None, 'save_safetensors': True, 'save_on_each_node': False, 'save_only_model': False, 'restore_callback_states_from_checkpoint': False, 'no_cuda': False, 'use_cpu': False, 'use_mps_device': False, 'seed': 42, 'data_seed': 42, 'jit_mode_eval': False, 'bf16': True, 'fp16': False, 'fp16_opt_level': 'O1', 'half_precision_backend': 'auto', 'bf16_full_eval': False, 'fp16_full_eval': False, 'tf32': None, 'local_rank': 0, 'ddp_backend': None, 'tpu_num_cores': None, 'tpu_metrics_debug': False, 'debug': [], 'dataloader_drop_last': True, 'eval_steps': 20, 'dataloader_num_workers': 1, 'dataloader_prefetch_factor': 2, 'past_index': -1, 'run_name': 'qwen3asr_dapo_reward56_4x4x12_12gen_4GPU', 'disable_tqdm': False, 'remove_unused_columns': False, 'label_names': None, 'load_best_model_at_end': False, 'metric_for_best_model': 'loss', 'greater_is_better': False, 'ignore_data_skip': False, 'fsdp': [], 'fsdp_min_num_params': 0, 'fsdp_config': {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}, 'fsdp_transformer_layer_cls_to_wrap': None, 'accelerator_config': {'split_batches': False, 'dispatch_batches': False, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None}, 'parallelism_config': None, 'deepspeed': None, 'label_smoothing_factor': 0.0, 'optim': 'adamw_torch', 'optim_args': None, 'adafactor': False, 'group_by_length': False, 'length_column_name': 'length', 'report_to': ['wandb'], 'project': 'huggingface', 'trackio_space_id': 'trackio', 'ddp_find_unused_parameters': None, 'ddp_bucket_cap_mb': None, 'ddp_broadcast_buffers': None, 'dataloader_pin_memory': True, 'dataloader_persistent_workers': False, 'skip_memory_metrics': True, 'use_legacy_prediction_loop': False, 'push_to_hub': False, 'resume_from_checkpoint': None, 'hub_model_id': None, 'hub_strategy': 'every_save', 'hub_token': '<HUB_TOKEN>', 'hub_private_repo': None, 'hub_always_push': False, 'hub_revision': None, 
'gradient_checkpointing': False, 'gradient_checkpointing_kwargs': None, 'include_inputs_for_metrics': False, 'include_for_metrics': [], 'eval_do_concat_batches': True, 'fp16_backend': 'auto', 'push_to_hub_model_id': None, 'push_to_hub_organization': None, 'push_to_hub_token': '<PUSH_TO_HUB_TOKEN>', 'mp_parameters': '', 'auto_find_batch_size': False, 'full_determinism': False, 'torchdynamo': None, 'ray_scope': 'last', 'ddp_timeout': 18000000, 'torch_compile': False, 'torch_compile_backend': None, 'torch_compile_mode': None, 'include_tokens_per_second': False, 'include_num_input_tokens_seen': 'no', 'neftune_noise_alpha': None, 'optim_target_modules': None, 'batch_eval_metrics': False, 'eval_on_start': False, 'use_liger_kernel': False, 'liger_kernel_config': None, 'eval_use_gather_object': False, 'average_tokens_across_devices': True, 'model_init_kwargs': None, 'disable_dropout': False, 'cast_lm_head_to_fp32': False, 'num_generations': 12, 'num_generations_eval': 4, 'max_completion_length': 256, 'ds3_gather_for_generation': True, 'shuffle_dataset': True, 'generation_batch_size': 48, 'steps_per_generation': 3, 'min_p': None, 'generation_kwargs': None, 'chat_template_kwargs': None, 'use_transformers_paged': False, 'cache_implementation': None, 'use_vllm': False, 'vllm_mode': None, 'vllm_model_impl': 'vllm', 'vllm_enable_sleep_mode': False, 'vllm_structured_outputs_regex': None, 'vllm_server_base_url': None, 'vllm_server_host': None, 'vllm_server_port': [8000], 'vllm_server_timeout': 240.0, 'vllm_group_port': 51216, 'vllm_gpu_memory_utilization': 0.9, 'vllm_max_model_length': None, 'vllm_tensor_parallel_size': 1, 'beta': 0.04, 'num_iterations': 2, 'epsilon': 0.2, 'delta': None, 'epsilon_high': 0.28, 'sapo_temperature_neg': 1.05, 'sapo_temperature_pos': 1.0, 'importance_sampling_level': 'token', 'reward_weights': None, 'multi_objective_aggregation': 'sum_then_normalize', 'scale_rewards': 'group', 'loss_type': 'dapo', 'mask_truncated_completions': False, 'sync_ref_model': 
False, 'ref_model_mixup_alpha': 0.6, 'ref_model_sync_steps': 512, 'top_entropy_quantile': 1.0, 'max_tool_calling_iterations': None, 'vllm_importance_sampling_correction': True, 'vllm_importance_sampling_mode': 'sequence_mask', 'vllm_importance_sampling_cap': 3.0, 'off_policy_mask_threshold': None, 'use_bias_correction_kl': False, 'log_completions': True, 'num_completions_to_print': None, 'log_unique_prompts': False, 'log_completions_hub_repo': None, 'tuner_backend': 'peft', 'vit_gradient_checkpointing': True, 'router_aux_loss_coef': 0.0, 'enable_dft_loss': False, 'enable_channel_loss': False, 'safe_serialization': True, 'max_shard_size': '5GB', 'check_model': True, 'acc_strategy': 'token', 'train_dataloader_shuffle': True, 'max_epochs': None, 'aligner_lr': None, 'vit_lr': None, 'use_logits_to_keep': None, 'resume_only_model': False, 'optimizer': None, 'eval_metric': None, 'callbacks': [], 'early_stop_interval': None, 'eval_use_evalscope': False, 'eval_dataset': [], 'eval_dataset_args': None, 'eval_limit': None, 'eval_generation_config': None, 'extra_eval_args': None, 'tuner_type': 'lora', 'use_galore': False, 'galore_target_modules': None, 'galore_rank': 128, 'galore_update_proj_gap': 50, 'galore_scale': 1.0, 'galore_proj_type': 'std', 'galore_optim_per_parameter': False, 'galore_with_embedding': False, 'galore_quantization': False, 'galore_proj_quant': False, 'galore_proj_bits': 4, 'galore_proj_group_size': 256, 'galore_cos_threshold': 0.4, 'galore_gamma_proj': 2, 'galore_queue_size': 5, 'lisa_activated_layers': 0, 'lisa_step_interval': 20, 'use_flash_ckpt': False, 'vllm_pipeline_parallel_size': 1, 'vllm_enable_expert_parallel': False, 'vllm_max_num_seqs': None, 'vllm_max_model_len': None, 'vllm_disable_custom_all_reduce': True, 'vllm_enforce_eager': False, 'vllm_limit_mm_per_prompt': None, 'vllm_max_lora_rank': 16, 'vllm_enable_prefix_caching': True, 'vllm_use_async_engine': None, 'vllm_quantization': None, 'vllm_reasoning_parser': None, 
'vllm_disable_cascade_attn': False, 'vllm_mm_processor_cache_gb': None, 'vllm_speculative_config': None, 'vllm_engine_kwargs': {}, 'vllm_data_parallel_size': 1, 'stop_words': [], 'vllm_enable_lora': False, 'lora_rank': 8, 'vllm_server_group_port': None, 'enable_flattened_weight_sync': True, 'async_generate': False, 'structured_outputs_regex': None, 'sleep_level': 0, 'move_model_batches': None, 'offload_optimizer': False, 'offload_model': False, 'wandb_log_unique_prompts': None, 'cosine_min_len_value_wrong': -0.5, 'cosine_max_len_value_wrong': 0.0, 'cosine_min_len_value_correct': 1.0, 'cosine_max_len_value_correct': 0.5, 'cosine_max_len': 256, 'repetition_n_grams': 3, 'repetition_max_penalty': -1.0, 'reward_model': None, 'reward_model_plugin': None, 'chord_sft_dataset': [], 'chord_sft_per_device_train_batch_size': None, 'chord_enable_phi_function': False, 'chord_mu_warmup_steps': None, 'chord_mu_decay_steps': None, 'chord_mu_peak': None, 'chord_mu_valley': None, 'multi_turn_scheduler': None, 'max_turns': None, 'completion_length_limit_scope': 'per_round', 'vllm_server_pass_dataset': False, 'dynamic_sample': True, 'max_resample_times': 4, 'overlong_filter': True, 'soft_max_length': None, 'soft_cache_length': None, 'log_entropy': False, 'tau_pos': 1.0, 'tau_neg': 1.05, 'advantage_estimator': 'grpo', 'kl_in_reward': False, 'dataset_shuffle': True, 'rollout_importance_sampling_mode': None, 'rollout_importance_sampling_threshold': 2.0, 'log_rollout_offpolicy_metrics': False, 'off_policy_sequence_mask_delta': None}
|
| 23 |
+
2026-04-18 17:28:50,239 INFO MainThread:10295 [wandb_config.py:__setitem__():154] [no run ID] config set model/num_parameters = 2050307712 - <bound method Run._config_callback of <wandb.sdk.wandb_run.Run object at 0x7f7e494768f0>>
|
| 24 |
+
2026-04-18 17:28:50,239 INFO MainThread:10295 [wandb_run.py:_config_callback():1385] config_cb model/num_parameters 2050307712 None
|
| 25 |
+
2026-04-20 16:05:30,791 INFO wandb-AsyncioManager-main:10295 [service_client.py:_forward_responses():80] Reached EOF.
|
| 26 |
+
2026-04-20 16:05:30,792 INFO wandb-AsyncioManager-main:10295 [mailbox.py:close():137] Closing mailbox, abandoning 1 handles.
|
wandb/run-20260417_122253-6ntp64iz/files/output.log
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
wandb/run-20260417_122253-6ntp64iz/files/requirements.txt
ADDED
|
@@ -0,0 +1,255 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
psutil==7.2.2
|
| 2 |
+
colorama==0.4.6
|
| 3 |
+
typing-inspection==0.4.2
|
| 4 |
+
dill==0.3.8
|
| 5 |
+
aliyun-python-sdk-kms==2.16.5
|
| 6 |
+
urllib3==2.6.3
|
| 7 |
+
torch==2.6.0
|
| 8 |
+
threadpoolctl==3.6.0
|
| 9 |
+
pyzmq==27.1.0
|
| 10 |
+
astor==0.8.1
|
| 11 |
+
hf-xet==1.4.3
|
| 12 |
+
sniffio==1.3.1
|
| 13 |
+
tensorboard==2.20.0
|
| 14 |
+
fastar==0.11.0
|
| 15 |
+
llvmlite==0.43.0
|
| 16 |
+
pathspec==1.0.4
|
| 17 |
+
mkl_fft==1.3.11
|
| 18 |
+
prometheus_client==0.25.0
|
| 19 |
+
async-timeout==5.0.1
|
| 20 |
+
scikit-learn==1.7.2
|
| 21 |
+
sortedcontainers==2.4.0
|
| 22 |
+
Bottleneck==1.4.2
|
| 23 |
+
orjson==3.11.8
|
| 24 |
+
nest-asyncio==1.6.0
|
| 25 |
+
cupy-cuda12x==13.6.0
|
| 26 |
+
semantic-version==2.10.0
|
| 27 |
+
aiosignal==1.4.0
|
| 28 |
+
fsspec==2025.3.0
|
| 29 |
+
dyNET38==2.2
|
| 30 |
+
shellingham==1.5.4
|
| 31 |
+
zstandard==0.25.0
|
| 32 |
+
PyYAML==6.0.3
|
| 33 |
+
nvidia-curand-cu12==10.3.5.147
|
| 34 |
+
gradio==5.50.0
|
| 35 |
+
Werkzeug==3.1.8
|
| 36 |
+
grpcio==1.80.0
|
| 37 |
+
aiohttp==3.13.5
|
| 38 |
+
Flask==3.1.3
|
| 39 |
+
python-json-logger==4.1.0
|
| 40 |
+
trl==0.29.1
|
| 41 |
+
nltk==3.9.4
|
| 42 |
+
platformdirs==4.9.6
|
| 43 |
+
lm-format-enforcer==0.10.12
|
| 44 |
+
pyparsing==3.3.2
|
| 45 |
+
jmespath==0.10.0
|
| 46 |
+
starlette==0.52.1
|
| 47 |
+
crcmod==1.7
|
| 48 |
+
dnspython==2.8.0
|
| 49 |
+
antlr4-python3-runtime==4.9.3
|
| 50 |
+
rouge==1.0.1
|
| 51 |
+
importlib_metadata==9.0.0
|
| 52 |
+
nvidia-cudnn-cu12==9.1.0.70
|
| 53 |
+
safetensors==0.7.0
|
| 54 |
+
blake3==1.0.8
|
| 55 |
+
interegular==0.3.3
|
| 56 |
+
tiktoken==0.11.0
|
| 57 |
+
pydantic_core==2.41.4
|
| 58 |
+
outlines==0.1.11
|
| 59 |
+
airportsdata==20260315
|
| 60 |
+
rich-toolkit==0.19.7
|
| 61 |
+
multiprocess==0.70.16
|
| 62 |
+
sympy==1.13.1
|
| 63 |
+
psutil==7.2.2
|
| 64 |
+
h11==0.16.0
|
| 65 |
+
anyio==4.13.0
|
| 66 |
+
Cython==3.2.4
|
| 67 |
+
outlines_core==0.1.26
|
| 68 |
+
jsonschema==4.26.0
|
| 69 |
+
nvidia-cuda-cupti-cu12==12.4.127
|
| 70 |
+
meson-python==0.19.0
|
| 71 |
+
depyf==0.18.0
|
| 72 |
+
audioread==3.1.0
|
| 73 |
+
typer==0.24.1
|
| 74 |
+
nvidia-cuda-nvrtc-cu12==12.4.127
|
| 75 |
+
joblib==1.5.3
|
| 76 |
+
torchvision==0.21.0
|
| 77 |
+
hf-gradio==0.3.2
|
| 78 |
+
huggingface_hub==0.36.2
|
| 79 |
+
websockets==15.0.1
|
| 80 |
+
diskcache==5.6.3
|
| 81 |
+
mistral_common==1.11.0
|
| 82 |
+
partial-json-parser==0.2.1.1.post7
|
| 83 |
+
simplejson==3.20.2
|
| 84 |
+
watchfiles==1.1.1
|
| 85 |
+
Jinja2==3.1.6
|
| 86 |
+
GitPython==3.1.46
|
| 87 |
+
numexpr==2.11.0
|
| 88 |
+
pydub==0.25.1
|
| 89 |
+
brotli==1.2.0
|
| 90 |
+
binpacking==2.0.1
|
| 91 |
+
cmake==4.3.1
|
| 92 |
+
pydantic==2.12.3
|
| 93 |
+
mkl-service==2.4.0
|
| 94 |
+
protobuf==6.33.6
|
| 95 |
+
gguf==0.10.0
|
| 96 |
+
MarkupSafe==3.0.3
|
| 97 |
+
exceptiongroup==1.3.1
|
| 98 |
+
markdown-it-py==4.0.0
|
| 99 |
+
soxr==1.0.0
|
| 100 |
+
pyarrow==20.0.0
|
| 101 |
+
tqdm==4.67.3
|
| 102 |
+
meson==1.11.0
|
| 103 |
+
fonttools==4.62.1
|
| 104 |
+
annotated-types==0.7.0
|
| 105 |
+
networkx==3.4.2
|
| 106 |
+
nvidia-cuda-runtime-cu12==12.4.127
|
| 107 |
+
compressed-tensors==0.9.2
|
| 108 |
+
wandb==0.23.0
|
| 109 |
+
mdurl==0.1.2
|
| 110 |
+
charset-normalizer==3.4.7
|
| 111 |
+
Pygments==2.20.0
|
| 112 |
+
zipp==3.23.1
|
| 113 |
+
prometheus-fastapi-instrumentator==7.1.0
|
| 114 |
+
aiofiles==24.1.0
|
| 115 |
+
lark==1.2.2
|
| 116 |
+
addict==2.4.0
|
| 117 |
+
pydantic-settings==2.13.1
|
| 118 |
+
opencv-python-headless==4.11.0.86
|
| 119 |
+
certifi==2026.2.25
|
| 120 |
+
sox==1.5.0
|
| 121 |
+
nagisa==0.2.11
|
| 122 |
+
six==1.17.0
|
| 123 |
+
tokenizers==0.22.2
|
| 124 |
+
mkl_random==1.2.8
|
| 125 |
+
fastapi-cloud-cli==0.17.0
|
| 126 |
+
propcache==0.4.1
|
| 127 |
+
cachetools==7.0.5
|
| 128 |
+
rpds-py==0.30.0
|
| 129 |
+
torchaudio==2.6.0
|
| 130 |
+
setuptools==82.0.1
|
| 131 |
+
py-cpuinfo==9.0.0
|
| 132 |
+
tomli==2.4.1
|
| 133 |
+
xxhash==3.6.0
|
| 134 |
+
pip==26.0.1
|
| 135 |
+
contourpy==1.3.2
|
| 136 |
+
absl-py==2.4.0
|
| 137 |
+
mpmath==1.3.0
|
| 138 |
+
ms_swift==4.0.3
|
| 139 |
+
pyproject-metadata==0.11.0
|
| 140 |
+
aiohappyeyeballs==2.6.1
|
| 141 |
+
httpx==0.28.1
|
| 142 |
+
json_repair==0.59.4
|
| 143 |
+
blinker==1.9.0
|
| 144 |
+
tzdata==2025.3
|
| 145 |
+
tensorboard-data-server==0.7.2
|
| 146 |
+
pydantic-extra-types==2.11.1
|
| 147 |
+
Markdown==3.10.2
|
| 148 |
+
nvidia-cusparselt-cu12==0.6.2
|
| 149 |
+
rignore==0.7.6
|
| 150 |
+
openai==2.32.0
|
| 151 |
+
soundfile==0.13.1
|
| 152 |
+
lazy-loader==0.5
|
| 153 |
+
av==14.2.0
|
| 154 |
+
yarl==1.23.0
|
| 155 |
+
python-dateutil==2.9.0.post0
|
| 156 |
+
groovy==0.1.2
|
| 157 |
+
xformers==0.0.29.post2
|
| 158 |
+
qwen-omni-utils==0.0.9
|
| 159 |
+
rich==15.0.0
|
| 160 |
+
xgrammar==0.1.16
|
| 161 |
+
numba==0.60.0
|
| 162 |
+
nvidia-cusolver-cu12==11.6.1.9
|
| 163 |
+
scikit_build_core==0.12.2
|
| 164 |
+
ffmpy==1.0.0
|
| 165 |
+
wheel==0.46.3
|
| 166 |
+
jiter==0.14.0
|
| 167 |
+
oss2==2.19.1
|
| 168 |
+
transformers==4.57.6
|
| 169 |
+
fastrlock==0.8.3
|
| 170 |
+
click==8.3.2
|
| 171 |
+
pooch==1.9.0
|
| 172 |
+
distro==1.9.0
|
| 173 |
+
nvidia-cublas-cu12==12.4.5.8
|
| 174 |
+
regex==2026.4.4
|
| 175 |
+
cpm-kernels==1.0.11
|
| 176 |
+
safehttpx==0.1.7
|
| 177 |
+
matplotlib==3.10.8
|
| 178 |
+
httptools==0.7.1
|
| 179 |
+
nvidia-cusparse-cu12==12.3.1.170
|
| 180 |
+
qwen-asr==0.0.6
|
| 181 |
+
gradio_client==1.14.0
|
| 182 |
+
gitdb==4.0.12
|
| 183 |
+
fastapi-cli==0.0.24
|
| 184 |
+
soynlp==0.0.493
|
| 185 |
+
python-dotenv==1.2.2
|
| 186 |
+
nvidia-cufft-cu12==11.2.1.3
|
| 187 |
+
accelerate==1.12.0
|
| 188 |
+
tomlkit==0.13.3
|
| 189 |
+
triton==3.2.0
|
| 190 |
+
filelock==3.28.0
|
| 191 |
+
pycountry==26.2.16
|
| 192 |
+
modelscope==1.35.4
|
| 193 |
+
annotated-doc==0.0.4
|
| 194 |
+
referencing==0.37.0
|
| 195 |
+
numpy==1.26.4
|
| 196 |
+
aliyun-python-sdk-core==2.16.0
|
| 197 |
+
attrs==26.1.0
|
| 198 |
+
vllm==0.8.0
|
| 199 |
+
python-multipart==0.0.26
|
| 200 |
+
jsonschema-specifications==2025.9.1
|
| 201 |
+
idna==3.11
|
| 202 |
+
scipy==1.15.3
|
| 203 |
+
typing_extensions==4.15.0
|
| 204 |
+
itsdangerous==2.2.0
|
| 205 |
+
msgspec==0.21.1
|
| 206 |
+
msgpack==1.1.2
|
| 207 |
+
nvidia-nvjitlink-cu12==12.4.127
|
| 208 |
+
pycryptodome==3.23.0
|
| 209 |
+
ninja==1.13.0
|
| 210 |
+
pillow==11.3.0
|
| 211 |
+
email-validator==2.3.0
|
| 212 |
+
cryptography==46.0.7
|
| 213 |
+
peft==0.18.1
|
| 214 |
+
kiwisolver==1.5.0
|
| 215 |
+
cffi==2.0.0
|
| 216 |
+
einops==0.8.2
|
| 217 |
+
pytz==2026.1.post1
|
| 218 |
+
uvloop==0.22.1
|
| 219 |
+
requests==2.33.1
|
| 220 |
+
sentencepiece==0.2.1
|
| 221 |
+
attrdict==2.0.1
|
| 222 |
+
dacite==1.9.2
|
| 223 |
+
cloudpickle==3.1.2
|
| 224 |
+
ray==2.55.0
|
| 225 |
+
fastapi==0.135.3
|
| 226 |
+
librosa==0.11.0
|
| 227 |
+
ruff==0.15.10
|
| 228 |
+
multidict==6.7.1
|
| 229 |
+
smmap==5.0.3
|
| 230 |
+
packaging==26.0
|
| 231 |
+
pycparser==3.0
|
| 232 |
+
decorator==5.2.1
|
| 233 |
+
transformers-stream-generator==0.0.5
|
| 234 |
+
nvidia-nccl-cu12==2.21.5
|
| 235 |
+
frozenlist==1.8.0
|
| 236 |
+
uvicorn==0.44.0
|
| 237 |
+
datasets==3.6.0
|
| 238 |
+
cycler==0.12.1
|
| 239 |
+
omegaconf==2.3.0
|
| 240 |
+
httpcore==1.0.9
|
| 241 |
+
pandas==2.3.2
|
| 242 |
+
nvidia-nvtx-cu12==12.4.127
|
| 243 |
+
sentry-sdk==2.58.0
|
| 244 |
+
wheel==0.46.3
|
| 245 |
+
autocommand==2.2.2
|
| 246 |
+
tomli==2.4.0
|
| 247 |
+
packaging==26.0
|
| 248 |
+
more-itertools==10.8.0
|
| 249 |
+
zipp==3.23.0
|
| 250 |
+
platformdirs==4.4.0
|
| 251 |
+
jaraco.context==6.1.0
|
| 252 |
+
jaraco.text==4.0.0
|
| 253 |
+
backports.tarfile==1.2.0
|
| 254 |
+
jaraco.functools==4.4.0
|
| 255 |
+
importlib_metadata==8.7.1
|
wandb/run-20260417_122253-6ntp64iz/files/wandb-metadata.json
ADDED
|
@@ -0,0 +1,223 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"os": "Linux-3.10.0-957.el7.x86_64-x86_64-with-glibc2.17",
|
| 3 |
+
"python": "CPython 3.10.18",
|
| 4 |
+
"startedAt": "2026-04-17T04:22:53.361994Z",
|
| 5 |
+
"args": [
|
| 6 |
+
"--rlhf_type",
|
| 7 |
+
"grpo",
|
| 8 |
+
"--external_plugins",
|
| 9 |
+
"/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/my_qwen3_asr_dapo_register.py",
|
| 10 |
+
"/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/0417_reward.py",
|
| 11 |
+
"--model",
|
| 12 |
+
"/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/qwen3-asr-merged",
|
| 13 |
+
"--model_type",
|
| 14 |
+
"my_qwen3_asr_rl",
|
| 15 |
+
"--template",
|
| 16 |
+
"my_qwen3_asr_rl",
|
| 17 |
+
"--dataset",
|
| 18 |
+
"/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/lora_0323_10w+55w+error+syn_with_domain_train90_targeted_rl_train90_loramerged_basewer_3suppress_server.jsonl",
|
| 19 |
+
"--val_dataset",
|
| 20 |
+
"/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/lora_0323_10w+55w+error+syn_with_domain_train90_targeted_rl_val5_sample5p_server.jsonl",
|
| 21 |
+
"--reward_funcs",
|
| 22 |
+
"asr_wer_sub_len_cmp_hallu_dirty_v56",
|
| 23 |
+
"--train_type",
|
| 24 |
+
"lora",
|
| 25 |
+
"--use_vllm",
|
| 26 |
+
"false",
|
| 27 |
+
"--log_completions",
|
| 28 |
+
"true",
|
| 29 |
+
"--loss_type",
|
| 30 |
+
"dapo",
|
| 31 |
+
"--advantage_estimator",
|
| 32 |
+
"grpo",
|
| 33 |
+
"--scale_rewards",
|
| 34 |
+
"group",
|
| 35 |
+
"--num_iterations",
|
| 36 |
+
"2",
|
| 37 |
+
"--beta",
|
| 38 |
+
"0.04",
|
| 39 |
+
"--epsilon_high",
|
| 40 |
+
"0.28",
|
| 41 |
+
"--dynamic_sample",
|
| 42 |
+
"true",
|
| 43 |
+
"--max_resample_times",
|
| 44 |
+
"4",
|
| 45 |
+
"--overlong_filter",
|
| 46 |
+
"true",
|
| 47 |
+
"--truncation_strategy",
|
| 48 |
+
"delete",
|
| 49 |
+
"--num_generations",
|
| 50 |
+
"12",
|
| 51 |
+
"--generation_batch_size",
|
| 52 |
+
"48",
|
| 53 |
+
"--per_device_train_batch_size",
|
| 54 |
+
"8",
|
| 55 |
+
"--per_device_eval_batch_size",
|
| 56 |
+
"8",
|
| 57 |
+
"--gradient_accumulation_steps",
|
| 58 |
+
"12",
|
| 59 |
+
"--num_generations_eval",
|
| 60 |
+
"4",
|
| 61 |
+
"--max_completion_length",
|
| 62 |
+
"256",
|
| 63 |
+
"--temperature",
|
| 64 |
+
"0.50",
|
| 65 |
+
"--top_p",
|
| 66 |
+
"0.95",
|
| 67 |
+
"--top_k",
|
| 68 |
+
"50",
|
| 69 |
+
"--repetition_penalty",
|
| 70 |
+
"1.08",
|
| 71 |
+
"--learning_rate",
|
| 72 |
+
"5e-5",
|
| 73 |
+
"--lr_scheduler_type",
|
| 74 |
+
"cosine",
|
| 75 |
+
"--warmup_ratio",
|
| 76 |
+
"0.03",
|
| 77 |
+
"--report_to",
|
| 78 |
+
"wandb",
|
| 79 |
+
"--run_name",
|
| 80 |
+
"qwen3asr_dapo_reward56_4x4x12_12gen_4GPU",
|
| 81 |
+
"--output_dir",
|
| 82 |
+
"/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/out/qwen3asr_dapo_reward56_4x4x12_12gen_4GPU",
|
| 83 |
+
"--save_strategy",
|
| 84 |
+
"steps",
|
| 85 |
+
"--save_steps",
|
| 86 |
+
"20",
|
| 87 |
+
"--logging_steps",
|
| 88 |
+
"5",
|
| 89 |
+
"--freeze_llm",
|
| 90 |
+
"false",
|
| 91 |
+
"--freeze_vit",
|
| 92 |
+
"false",
|
| 93 |
+
"--freeze_aligner",
|
| 94 |
+
"false",
|
| 95 |
+
"--remove_unused_columns",
|
| 96 |
+
"false",
|
| 97 |
+
"--padding_side",
|
| 98 |
+
"left"
|
| 99 |
+
],
|
| 100 |
+
"program": "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/cli/rlhf.py",
|
| 101 |
+
"email": "pang_kaiyu@163.com",
|
| 102 |
+
"root": "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload",
|
| 103 |
+
"host": "SH-IDC1-10-140-37-95",
|
| 104 |
+
"executable": "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/bin/python3.10",
|
| 105 |
+
"cpu_count": 64,
|
| 106 |
+
"cpu_count_logical": 128,
|
| 107 |
+
"gpu": "NVIDIA A100-SXM4-80GB",
|
| 108 |
+
"gpu_count": 8,
|
| 109 |
+
"disk": {
|
| 110 |
+
"/": {
|
| 111 |
+
"total": "524945911808",
|
| 112 |
+
"used": "37367128064"
|
| 113 |
+
}
|
| 114 |
+
},
|
| 115 |
+
"memory": {
|
| 116 |
+
"total": "1081627828224"
|
| 117 |
+
},
|
| 118 |
+
"gpu_nvidia": [
|
| 119 |
+
{
|
| 120 |
+
"name": "NVIDIA A100-SXM4-80GB",
|
| 121 |
+
"memoryTotal": "85899345920",
|
| 122 |
+
"cudaCores": 6912,
|
| 123 |
+
"architecture": "Ampere",
|
| 124 |
+
"uuid": "GPU-87e7e3ab-b254-fc22-7407-8e2e88e9d854"
|
| 125 |
+
},
|
| 126 |
+
{
|
| 127 |
+
"name": "NVIDIA A100-SXM4-80GB",
|
| 128 |
+
"memoryTotal": "85899345920",
|
| 129 |
+
"cudaCores": 6912,
|
| 130 |
+
"architecture": "Ampere",
|
| 131 |
+
"uuid": "GPU-976db8a1-cf00-11c6-caaa-413862233fd4"
|
| 132 |
+
},
|
| 133 |
+
{
|
| 134 |
+
"name": "NVIDIA A100-SXM4-80GB",
|
| 135 |
+
"memoryTotal": "85899345920",
|
| 136 |
+
"cudaCores": 6912,
|
| 137 |
+
"architecture": "Ampere",
|
| 138 |
+
"uuid": "GPU-78b37ae8-44e0-e318-a6c0-f6f4ac78d46a"
|
| 139 |
+
},
|
| 140 |
+
{
|
| 141 |
+
"name": "NVIDIA A100-SXM4-80GB",
|
| 142 |
+
"memoryTotal": "85899345920",
|
| 143 |
+
"cudaCores": 6912,
|
| 144 |
+
"architecture": "Ampere",
|
| 145 |
+
"uuid": "GPU-840b937d-a7d4-68e7-ad57-f4568e01c3ae"
|
| 146 |
+
},
|
| 147 |
+
{
|
| 148 |
+
"name": "NVIDIA A100-SXM4-80GB",
|
| 149 |
+
"memoryTotal": "85899345920",
|
| 150 |
+
"cudaCores": 6912,
|
| 151 |
+
"architecture": "Ampere",
|
| 152 |
+
"uuid": "GPU-a9d0de54-f5b5-f83b-7bda-f53db844622d"
|
| 153 |
+
},
|
| 154 |
+
{
|
| 155 |
+
"name": "NVIDIA A100-SXM4-80GB",
|
| 156 |
+
"memoryTotal": "85899345920",
|
| 157 |
+
"cudaCores": 6912,
|
| 158 |
+
"architecture": "Ampere",
|
| 159 |
+
"uuid": "GPU-cb7d22e9-305c-c68c-64f1-599580742db0"
|
| 160 |
+
},
|
| 161 |
+
{
|
| 162 |
+
"name": "NVIDIA A100-SXM4-80GB",
|
| 163 |
+
"memoryTotal": "85899345920",
|
| 164 |
+
"cudaCores": 6912,
|
| 165 |
+
"architecture": "Ampere",
|
| 166 |
+
"uuid": "GPU-8d9704bb-4592-346f-a7f2-1a6ed8d58619"
|
| 167 |
+
},
|
| 168 |
+
{
|
| 169 |
+
"name": "NVIDIA A100-SXM4-80GB",
|
| 170 |
+
"memoryTotal": "85899345920",
|
| 171 |
+
"cudaCores": 6912,
|
| 172 |
+
"architecture": "Ampere",
|
| 173 |
+
"uuid": "GPU-3892f01b-e0b8-a9d9-0587-b5a7d2d9b5ab"
|
| 174 |
+
}
|
| 175 |
+
],
|
| 176 |
+
"cudaVersion": "12.4",
|
| 177 |
+
"slurm": {
|
| 178 |
+
"cluster_name": "cluster_sproject3",
|
| 179 |
+
"conf": "/etc/slurm/slurm.conf",
|
| 180 |
+
"cpus_on_node": "2",
|
| 181 |
+
"gtids": "0",
|
| 182 |
+
"job_account": "research",
|
| 183 |
+
"job_cpus_per_node": "2",
|
| 184 |
+
"job_gid": "800000689",
|
| 185 |
+
"job_id": "8568770",
|
| 186 |
+
"job_name": "qwen_debug",
|
| 187 |
+
"job_nodelist": "SH-IDC1-10-140-37-95",
|
| 188 |
+
"job_num_nodes": "1",
|
| 189 |
+
"job_partition": "interntmp",
|
| 190 |
+
"job_qos": "normal",
|
| 191 |
+
"job_uid": "800000689",
|
| 192 |
+
"job_user": "panjiabao",
|
| 193 |
+
"jobid": "8568770",
|
| 194 |
+
"launch_node_ipaddr": "10.140.37.164",
|
| 195 |
+
"localid": "0",
|
| 196 |
+
"nnodes": "1",
|
| 197 |
+
"nodeid": "0",
|
| 198 |
+
"nodelist": "SH-IDC1-10-140-37-95",
|
| 199 |
+
"nprocs": "1",
|
| 200 |
+
"ntasks": "1",
|
| 201 |
+
"prio_process": "0",
|
| 202 |
+
"procid": "0",
|
| 203 |
+
"srun_comm_host": "10.140.37.164",
|
| 204 |
+
"srun_comm_port": "36403",
|
| 205 |
+
"step_gpus": "6,7",
|
| 206 |
+
"step_id": "0",
|
| 207 |
+
"step_launcher_port": "36403",
|
| 208 |
+
"step_nodelist": "SH-IDC1-10-140-37-95",
|
| 209 |
+
"step_num_nodes": "1",
|
| 210 |
+
"step_num_tasks": "1",
|
| 211 |
+
"step_tasks_per_node": "1",
|
| 212 |
+
"stepid": "0",
|
| 213 |
+
"submit_dir": "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload",
|
| 214 |
+
"submit_host": "SH-IDC1-10-140-37-164",
|
| 215 |
+
"task_pid": "31135",
|
| 216 |
+
"tasks_per_node": "1",
|
| 217 |
+
"topology_addr": "SH-IDC1-10-140-37-95",
|
| 218 |
+
"topology_addr_pattern": "node",
|
| 219 |
+
"umask": "0002",
|
| 220 |
+
"working_cluster": "cluster_sproject3:SH-IDC1-10-140-37-161:6817:9216:109"
|
| 221 |
+
},
|
| 222 |
+
"writerId": "sxwlerlqfwjgxrof5mrowpggo62a230u"
|
| 223 |
+
}
|
wandb/run-20260417_122253-6ntp64iz/files/wandb-summary.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"_wandb":{"runtime":2},"_runtime":2}
|
wandb/run-20260417_122253-6ntp64iz/logs/debug-core.log
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{"time":"2026-04-17T12:22:53.678333465+08:00","level":"INFO","msg":"main: starting server","port-filename":"/tmp/tmpo93po4ye/port-45975.txt","pid":45975,"log-level":0,"disable-analytics":false,"shutdown-on-parent-exit":false,"enable-dcgm-profiling":false}
|
| 2 |
+
{"time":"2026-04-17T12:22:53.680473688+08:00","level":"INFO","msg":"server: will exit if parent process dies","ppid":45975}
|
| 3 |
+
{"time":"2026-04-17T12:22:53.680744122+08:00","level":"INFO","msg":"server: accepting connections","addr":{"Name":"/tmp/wandb-45975-46467-1709368994/socket","Net":"unix"}}
|
| 4 |
+
{"time":"2026-04-17T12:22:53.762137433+08:00","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"1(@)"}
|
| 5 |
+
{"time":"2026-04-17T12:22:53.771267911+08:00","level":"INFO","msg":"handleInformInit: received","streamId":"6ntp64iz","id":"1(@)"}
|
| 6 |
+
{"time":"2026-04-17T12:22:54.22640511+08:00","level":"INFO","msg":"handleInformInit: stream started","streamId":"6ntp64iz","id":"1(@)"}
|
| 7 |
+
{"time":"2026-04-17T12:22:57.706591473+08:00","level":"INFO","msg":"handleInformTeardown: server teardown initiated","id":"1(@)"}
|
| 8 |
+
{"time":"2026-04-17T12:22:57.707133174+08:00","level":"INFO","msg":"server is shutting down"}
|
| 9 |
+
{"time":"2026-04-17T12:22:57.707126026+08:00","level":"INFO","msg":"connection: closing","id":"1(@)"}
|
| 10 |
+
{"time":"2026-04-17T12:22:57.707711702+08:00","level":"INFO","msg":"server: listener closed","addr":{"Name":"/tmp/wandb-45975-46467-1709368994/socket","Net":"unix"}}
|
| 11 |
+
{"time":"2026-04-17T12:22:57.708226504+08:00","level":"INFO","msg":"connection: closed successfully","id":"1(@)"}
|
| 12 |
+
{"time":"2026-04-17T12:22:57.795817111+08:00","level":"INFO","msg":"server: parent process exited, terminating service process"}
|
wandb/run-20260417_122253-6ntp64iz/logs/debug-internal.log
ADDED
|
@@ -0,0 +1,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{"time":"2026-04-17T12:22:53.773961459+08:00","level":"INFO","msg":"stream: starting","core version":"0.23.0"}
|
| 2 |
+
{"time":"2026-04-17T12:22:54.222742714+08:00","level":"INFO","msg":"stream: created new stream","id":"6ntp64iz"}
|
| 3 |
+
{"time":"2026-04-17T12:22:54.222847789+08:00","level":"INFO","msg":"handler: started","stream_id":"6ntp64iz"}
|
| 4 |
+
{"time":"2026-04-17T12:22:54.226396493+08:00","level":"INFO","msg":"stream: started","id":"6ntp64iz"}
|
| 5 |
+
{"time":"2026-04-17T12:22:54.22641049+08:00","level":"INFO","msg":"sender: started","stream_id":"6ntp64iz"}
|
| 6 |
+
{"time":"2026-04-17T12:22:54.226419522+08:00","level":"INFO","msg":"writer: started","stream_id":"6ntp64iz"}
|
| 7 |
+
{"time":"2026-04-17T12:22:57.70713564+08:00","level":"INFO","msg":"stream: closing","id":"6ntp64iz"}
|
wandb/run-20260417_122253-6ntp64iz/logs/debug.log
ADDED
|
@@ -0,0 +1,26 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
2026-04-17 12:22:53,409 INFO MainThread:45975 [wandb_setup.py:_flush():80] Current SDK version is 0.23.0
|
| 2 |
+
2026-04-17 12:22:53,409 INFO MainThread:45975 [wandb_setup.py:_flush():80] Configure stats pid to 45975
|
| 3 |
+
2026-04-17 12:22:53,409 INFO MainThread:45975 [wandb_setup.py:_flush():80] Loading settings from /mnt/petrelfs/panjiabao/.config/wandb/settings
|
| 4 |
+
2026-04-17 12:22:53,409 INFO MainThread:45975 [wandb_setup.py:_flush():80] Loading settings from /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/wandb/settings
|
| 5 |
+
2026-04-17 12:22:53,409 INFO MainThread:45975 [wandb_setup.py:_flush():80] Loading settings from environment variables
|
| 6 |
+
2026-04-17 12:22:53,409 INFO MainThread:45975 [wandb_init.py:setup_run_log_directory():713] Logging user logs to /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/wandb/run-20260417_122253-6ntp64iz/logs/debug.log
|
| 7 |
+
2026-04-17 12:22:53,409 INFO MainThread:45975 [wandb_init.py:setup_run_log_directory():714] Logging internal logs to /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/wandb/run-20260417_122253-6ntp64iz/logs/debug-internal.log
|
| 8 |
+
2026-04-17 12:22:53,409 INFO MainThread:45975 [wandb_init.py:init():840] calling init triggers
|
| 9 |
+
2026-04-17 12:22:53,409 INFO MainThread:45975 [wandb_init.py:init():845] wandb.init called with sweep_config: {}
|
| 10 |
+
config: {'_wandb': {}}
|
| 11 |
+
2026-04-17 12:22:53,409 INFO MainThread:45975 [wandb_init.py:init():888] starting backend
|
| 12 |
+
2026-04-17 12:22:53,762 INFO MainThread:45975 [wandb_init.py:init():891] sending inform_init request
|
| 13 |
+
2026-04-17 12:22:53,766 INFO MainThread:45975 [wandb_init.py:init():899] backend started and connected
|
| 14 |
+
2026-04-17 12:22:53,768 INFO MainThread:45975 [wandb_init.py:init():969] updated telemetry
|
| 15 |
+
2026-04-17 12:22:53,769 INFO MainThread:45975 [wandb_init.py:init():993] communicating run to backend with 90.0 second timeout
|
| 16 |
+
2026-04-17 12:22:55,268 INFO MainThread:45975 [wandb_init.py:init():1040] starting run threads in backend
|
| 17 |
+
2026-04-17 12:22:55,848 INFO MainThread:45975 [wandb_run.py:_console_start():2504] atexit reg
|
| 18 |
+
2026-04-17 12:22:55,848 INFO MainThread:45975 [wandb_run.py:_redirect():2352] redirect: wrap_raw
|
| 19 |
+
2026-04-17 12:22:55,848 INFO MainThread:45975 [wandb_run.py:_redirect():2421] Wrapping output streams.
|
| 20 |
+
2026-04-17 12:22:55,848 INFO MainThread:45975 [wandb_run.py:_redirect():2444] Redirects installed.
|
| 21 |
+
2026-04-17 12:22:55,854 INFO MainThread:45975 [wandb_init.py:init():1080] run started, returning control to user process
|
| 22 |
+
2026-04-17 12:22:55,859 INFO MainThread:45975 [wandb_run.py:_config_callback():1385] config_cb None None {'peft_config': {'default': {'task_type': 'CAUSAL_LM', 'peft_type': 'LORA', 'auto_mapping': None, 'peft_version': '0.18.1', 'base_model_name_or_path': '/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/qwen3-asr-merged', 'revision': None, 'inference_mode': False, 'r': 8, 'target_modules': '^(thinker\\.model(?=\\.).*\\.(v_proj|down_proj|gate_proj|q_proj|o_proj|k_proj|up_proj)|thinker\\.audio_tower\\.layers(?=\\.).*\\.(v_proj|fc2|fc1|out_proj|q_proj|k_proj)|thinker\\.audio_tower\\.conv_out(?=\\.)|thinker\\.audio_tower\\.proj1(?=\\.)|thinker\\.audio_tower\\.proj2(?=\\.))$', 'exclude_modules': None, 'lora_alpha': 32, 'lora_dropout': 0.05, 'fan_in_fan_out': False, 'bias': 'none', 'use_rslora': False, 'modules_to_save': [], 'init_lora_weights': True, 'layers_to_transform': None, 'layers_pattern': None, 'rank_pattern': {}, 'alpha_pattern': {}, 'megatron_config': None, 'megatron_core': 'megatron.core', 'trainable_token_indices': None, 'loftq_config': {}, 'eva_config': None, 'corda_config': None, 'use_dora': False, 'alora_invocation_tokens': None, 'use_qalora': False, 'qalora_group_size': 16, 'layer_replication': None, 'runtime_config': {'ephemeral_gpu_offload': False}, 'lora_bias': False, 'target_parameters': None, 'arrow_config': None, 'ensure_weight_tying': False, 'lora_dtype': None, 'lorap_lr_ratio': None, 'lorap_emb_lr': 1e-06}}, 'return_dict': True, 'output_hidden_states': False, 'torchscript': False, 'dtype': 'bfloat16', 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'architectures': ['Qwen3ASRForConditionalGeneration'], 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'task_specific_params': None, 'problem_type': None, 
'tokenizer_class': None, 'prefix': None, 'bos_token_id': None, 'pad_token_id': 151643, 'eos_token_id': 151645, 'sep_token_id': None, 'decoder_start_token_id': None, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'temperature': 0.5, 'top_k': 50, 'top_p': 0.95, 'typical_p': 1.0, 'repetition_penalty': 1.08, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'num_beam_groups': 1, 'diversity_penalty': 0.0, '_name_or_path': '/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/qwen3-asr-merged', 'transformers_version': '4.57.6', 'model_type': 'qwen3_asr', 'tf_legacy_loss': False, 'use_bfloat16': False, 'thinker_config': {'return_dict': True, 'output_hidden_states': False, 'torchscript': False, 'dtype': 'bfloat16', 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'architectures': ['Qwen3ASRForConditionalGeneration'], 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'task_specific_params': None, 'problem_type': None, 'tokenizer_class': None, 'prefix': None, 'bos_token_id': None, 'pad_token_id': None, 'eos_token_id': None, 'sep_token_id': None, 'decoder_start_token_id': None, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'typical_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 
'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'num_beam_groups': 1, 'diversity_penalty': 0.0, '_name_or_path': '', 'audio_end_token_id': 151670, 'model_type': 'qwen3_asr_thinker', 'tf_legacy_loss': False, 'use_bfloat16': False, 'user_token_id': 872, 'audio_start_token_id': 151669, 'initializer_range': 0.02, 'audio_config': {'return_dict': True, 'output_hidden_states': False, 'torchscript': False, 'dtype': None, 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'architectures': None, 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'task_specific_params': None, 'problem_type': None, 'tokenizer_class': None, 'prefix': None, 'bos_token_id': None, 'pad_token_id': None, 'eos_token_id': None, 'sep_token_id': None, 'decoder_start_token_id': None, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'typical_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'num_beam_groups': 1, 'diversity_penalty': 0.0, '_name_or_path': '', 'model_type': 'qwen3_asr_audio_encoder', 'num_hidden_layers': 24, 'tf_legacy_loss': False, 'use_bfloat16': False, 'num_mel_bins': 128, 'd_model': 
1024, 'encoder_layers': 24, 'encoder_attention_heads': 16, 'encoder_ffn_dim': 4096, 'dropout': 0, 'attention_dropout': 0, 'activation_function': 'gelu', 'activation_dropout': 0, 'initializer_range': 0.02, 'scale_embedding': False, 'max_source_positions': 1500, 'n_window': 50, 'output_dim': 2048, 'n_window_infer': 800, 'conv_chunksize': 500, 'downsample_hidden_size': 480, 'output_attentions': False}, 'text_config': {'vocab_size': 151936, 'max_position_embeddings': 65536, 'hidden_size': 2048, 'intermediate_size': 6144, 'num_hidden_layers': 28, 'num_attention_heads': 16, 'num_key_value_heads': 8, 'head_dim': 128, 'hidden_act': 'silu', 'initializer_range': 0.02, 'rms_norm_eps': 1e-06, 'use_cache': False, 'rope_theta': 1000000, 'rope_scaling': {'interleaved': True, 'mrope_interleaved': True, 'mrope_section': [24, 20, 20], 'rope_type': 'default', 'type': 'default'}, 'attention_bias': False, 'attention_dropout': 0.0, 'return_dict': True, 'output_hidden_states': False, 'torchscript': False, 'dtype': None, 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'architectures': None, 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'task_specific_params': None, 'problem_type': None, 'tokenizer_class': None, 'prefix': None, 'bos_token_id': None, 'pad_token_id': 151643, 'eos_token_id': None, 'sep_token_id': None, 'decoder_start_token_id': None, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'typical_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 
'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'num_beam_groups': 1, 'diversity_penalty': 0.0, '_name_or_path': '', 'model_type': 'qwen3_asr_text', 'tf_legacy_loss': False, 'use_bfloat16': False, 'output_attentions': False}, 'audio_token_id': 151676, 'output_attentions': False}, 'support_languages': ['Chinese', 'English', 'Cantonese', 'Arabic', 'German', 'French', 'Spanish', 'Portuguese', 'Indonesian', 'Italian', 'Korean', 'Russian', 'Thai', 'Vietnamese', 'Japanese', 'Turkish', 'Hindi', 'Malay', 'Dutch', 'Swedish', 'Danish', 'Finnish', 'Polish', 'Czech', 'Filipino', 'Persian', 'Greek', 'Romanian', 'Hungarian', 'Macedonian'], 'output_attentions': False, 'output_dir': '/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/out/qwen3asr_dapo_reward56_4x4x12_12gen_4GPU/v2-20260417-122243', 'overwrite_output_dir': False, 'do_train': False, 'do_eval': True, 'do_predict': False, 'eval_strategy': 'steps', 'prediction_loss_only': False, 'per_device_train_batch_size': 8, 'per_device_eval_batch_size': 8, 'per_gpu_train_batch_size': None, 'per_gpu_eval_batch_size': None, 'gradient_accumulation_steps': 12, 'eval_accumulation_steps': None, 'eval_delay': 0, 'torch_empty_cache_steps': None, 'learning_rate': 5e-05, 'weight_decay': 0.1, 'adam_beta1': 0.9, 'adam_beta2': 0.95, 'adam_epsilon': 1e-08, 'max_grad_norm': 1.0, 'num_train_epochs': 3.0, 'max_steps': -1, 'lr_scheduler_type': 'cosine', 'lr_scheduler_kwargs': None, 'warmup_ratio': 0.03, 'warmup_steps': 0, 'log_level': 'passive', 'log_level_replica': 'warning', 'log_on_each_node': True, 'logging_dir': '/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/out/qwen3asr_dapo_reward56_4x4x12_12gen_4GPU/v2-20260417-122243/runs', 'logging_strategy': 'steps', 'logging_first_step': True, 'logging_steps': 5, 'logging_nan_inf_filter': True, 'save_strategy': 'steps', 'save_steps': 20, 'save_total_limit': 
None, 'save_safetensors': True, 'save_on_each_node': False, 'save_only_model': False, 'restore_callback_states_from_checkpoint': False, 'no_cuda': False, 'use_cpu': False, 'use_mps_device': False, 'seed': 42, 'data_seed': 42, 'jit_mode_eval': False, 'bf16': True, 'fp16': False, 'fp16_opt_level': 'O1', 'half_precision_backend': 'auto', 'bf16_full_eval': False, 'fp16_full_eval': False, 'tf32': None, 'local_rank': 0, 'ddp_backend': None, 'tpu_num_cores': None, 'tpu_metrics_debug': False, 'debug': [], 'dataloader_drop_last': True, 'eval_steps': 20, 'dataloader_num_workers': 1, 'dataloader_prefetch_factor': 2, 'past_index': -1, 'run_name': 'qwen3asr_dapo_reward56_4x4x12_12gen_4GPU', 'disable_tqdm': False, 'remove_unused_columns': False, 'label_names': None, 'load_best_model_at_end': False, 'metric_for_best_model': 'loss', 'greater_is_better': False, 'ignore_data_skip': False, 'fsdp': [], 'fsdp_min_num_params': 0, 'fsdp_config': {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}, 'fsdp_transformer_layer_cls_to_wrap': None, 'accelerator_config': {'split_batches': False, 'dispatch_batches': False, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None}, 'parallelism_config': None, 'deepspeed': None, 'label_smoothing_factor': 0.0, 'optim': 'adamw_torch', 'optim_args': None, 'adafactor': False, 'group_by_length': False, 'length_column_name': 'length', 'report_to': ['wandb'], 'project': 'huggingface', 'trackio_space_id': 'trackio', 'ddp_find_unused_parameters': None, 'ddp_bucket_cap_mb': None, 'ddp_broadcast_buffers': None, 'dataloader_pin_memory': True, 'dataloader_persistent_workers': False, 'skip_memory_metrics': True, 'use_legacy_prediction_loop': False, 'push_to_hub': False, 'resume_from_checkpoint': None, 'hub_model_id': None, 'hub_strategy': 'every_save', 'hub_token': '<HUB_TOKEN>', 'hub_private_repo': None, 'hub_always_push': False, 'hub_revision': None, 
'gradient_checkpointing': False, 'gradient_checkpointing_kwargs': None, 'include_inputs_for_metrics': False, 'include_for_metrics': [], 'eval_do_concat_batches': True, 'fp16_backend': 'auto', 'push_to_hub_model_id': None, 'push_to_hub_organization': None, 'push_to_hub_token': '<PUSH_TO_HUB_TOKEN>', 'mp_parameters': '', 'auto_find_batch_size': False, 'full_determinism': False, 'torchdynamo': None, 'ray_scope': 'last', 'ddp_timeout': 18000000, 'torch_compile': False, 'torch_compile_backend': None, 'torch_compile_mode': None, 'include_tokens_per_second': False, 'include_num_input_tokens_seen': 'no', 'neftune_noise_alpha': None, 'optim_target_modules': None, 'batch_eval_metrics': False, 'eval_on_start': False, 'use_liger_kernel': False, 'liger_kernel_config': None, 'eval_use_gather_object': False, 'average_tokens_across_devices': True, 'model_init_kwargs': None, 'disable_dropout': False, 'cast_lm_head_to_fp32': False, 'num_generations': 12, 'num_generations_eval': 4, 'max_completion_length': 256, 'ds3_gather_for_generation': True, 'shuffle_dataset': True, 'generation_batch_size': 48, 'steps_per_generation': 3, 'min_p': None, 'generation_kwargs': None, 'chat_template_kwargs': None, 'use_transformers_paged': False, 'cache_implementation': None, 'use_vllm': False, 'vllm_mode': None, 'vllm_model_impl': 'vllm', 'vllm_enable_sleep_mode': False, 'vllm_structured_outputs_regex': None, 'vllm_server_base_url': None, 'vllm_server_host': None, 'vllm_server_port': [8000], 'vllm_server_timeout': 240.0, 'vllm_group_port': 51216, 'vllm_gpu_memory_utilization': 0.9, 'vllm_max_model_length': None, 'vllm_tensor_parallel_size': 1, 'beta': 0.04, 'num_iterations': 2, 'epsilon': 0.2, 'delta': None, 'epsilon_high': 0.28, 'sapo_temperature_neg': 1.05, 'sapo_temperature_pos': 1.0, 'importance_sampling_level': 'token', 'reward_weights': None, 'multi_objective_aggregation': 'sum_then_normalize', 'scale_rewards': 'group', 'loss_type': 'dapo', 'mask_truncated_completions': False, 'sync_ref_model': 
False, 'ref_model_mixup_alpha': 0.6, 'ref_model_sync_steps': 512, 'top_entropy_quantile': 1.0, 'max_tool_calling_iterations': None, 'vllm_importance_sampling_correction': True, 'vllm_importance_sampling_mode': 'sequence_mask', 'vllm_importance_sampling_cap': 3.0, 'off_policy_mask_threshold': None, 'use_bias_correction_kl': False, 'log_completions': True, 'num_completions_to_print': None, 'log_unique_prompts': False, 'log_completions_hub_repo': None, 'tuner_backend': 'peft', 'vit_gradient_checkpointing': True, 'router_aux_loss_coef': 0.0, 'enable_dft_loss': False, 'enable_channel_loss': False, 'safe_serialization': True, 'max_shard_size': '5GB', 'check_model': True, 'acc_strategy': 'token', 'train_dataloader_shuffle': True, 'max_epochs': None, 'aligner_lr': None, 'vit_lr': None, 'use_logits_to_keep': None, 'resume_only_model': False, 'optimizer': None, 'eval_metric': None, 'callbacks': [], 'early_stop_interval': None, 'eval_use_evalscope': False, 'eval_dataset': [], 'eval_dataset_args': None, 'eval_limit': None, 'eval_generation_config': None, 'extra_eval_args': None, 'tuner_type': 'lora', 'use_galore': False, 'galore_target_modules': None, 'galore_rank': 128, 'galore_update_proj_gap': 50, 'galore_scale': 1.0, 'galore_proj_type': 'std', 'galore_optim_per_parameter': False, 'galore_with_embedding': False, 'galore_quantization': False, 'galore_proj_quant': False, 'galore_proj_bits': 4, 'galore_proj_group_size': 256, 'galore_cos_threshold': 0.4, 'galore_gamma_proj': 2, 'galore_queue_size': 5, 'lisa_activated_layers': 0, 'lisa_step_interval': 20, 'use_flash_ckpt': False, 'vllm_pipeline_parallel_size': 1, 'vllm_enable_expert_parallel': False, 'vllm_max_num_seqs': None, 'vllm_max_model_len': None, 'vllm_disable_custom_all_reduce': True, 'vllm_enforce_eager': False, 'vllm_limit_mm_per_prompt': None, 'vllm_max_lora_rank': 16, 'vllm_enable_prefix_caching': True, 'vllm_use_async_engine': None, 'vllm_quantization': None, 'vllm_reasoning_parser': None, 
'vllm_disable_cascade_attn': False, 'vllm_mm_processor_cache_gb': None, 'vllm_speculative_config': None, 'vllm_engine_kwargs': {}, 'vllm_data_parallel_size': 1, 'stop_words': [], 'vllm_enable_lora': False, 'lora_rank': 8, 'vllm_server_group_port': None, 'enable_flattened_weight_sync': True, 'async_generate': False, 'structured_outputs_regex': None, 'sleep_level': 0, 'move_model_batches': None, 'offload_optimizer': False, 'offload_model': False, 'wandb_log_unique_prompts': None, 'cosine_min_len_value_wrong': -0.5, 'cosine_max_len_value_wrong': 0.0, 'cosine_min_len_value_correct': 1.0, 'cosine_max_len_value_correct': 0.5, 'cosine_max_len': 256, 'repetition_n_grams': 3, 'repetition_max_penalty': -1.0, 'reward_model': None, 'reward_model_plugin': None, 'chord_sft_dataset': [], 'chord_sft_per_device_train_batch_size': None, 'chord_enable_phi_function': False, 'chord_mu_warmup_steps': None, 'chord_mu_decay_steps': None, 'chord_mu_peak': None, 'chord_mu_valley': None, 'multi_turn_scheduler': None, 'max_turns': None, 'completion_length_limit_scope': 'per_round', 'vllm_server_pass_dataset': False, 'dynamic_sample': True, 'max_resample_times': 4, 'overlong_filter': True, 'soft_max_length': None, 'soft_cache_length': None, 'log_entropy': False, 'tau_pos': 1.0, 'tau_neg': 1.05, 'advantage_estimator': 'grpo', 'kl_in_reward': False, 'dataset_shuffle': True, 'rollout_importance_sampling_mode': None, 'rollout_importance_sampling_threshold': 2.0, 'log_rollout_offpolicy_metrics': False, 'off_policy_sequence_mask_delta': None}
|
| 23 |
+
2026-04-17 12:22:55,870 INFO MainThread:45975 [wandb_config.py:__setitem__():154] [no run ID] config set model/num_parameters = 2050307712 - <bound method Run._config_callback of <wandb.sdk.wandb_run.Run object at 0x7fe90873e920>>
|
| 24 |
+
2026-04-17 12:22:55,870 INFO MainThread:45975 [wandb_run.py:_config_callback():1385] config_cb model/num_parameters 2050307712 None
|
| 25 |
+
2026-04-17 12:22:57,706 INFO wandb-AsyncioManager-main:45975 [service_client.py:_forward_responses():80] Reached EOF.
|
| 26 |
+
2026-04-17 12:22:57,707 INFO wandb-AsyncioManager-main:45975 [mailbox.py:close():137] Closing mailbox, abandoning 1 handles.
|
wandb/run-20260417_123237-3h84yfea/files/config.yaml
ADDED
|
@@ -0,0 +1,1272 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
_name_or_path:
|
| 2 |
+
value: /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/qwen3-asr-merged
|
| 3 |
+
_wandb:
|
| 4 |
+
value:
|
| 5 |
+
cli_version: 0.23.0
|
| 6 |
+
e:
|
| 7 |
+
bpic2cpmtxvnwca2pu2tg19g1j2qwpb2:
|
| 8 |
+
args:
|
| 9 |
+
- --rlhf_type
|
| 10 |
+
- grpo
|
| 11 |
+
- --external_plugins
|
| 12 |
+
- /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/my_qwen3_asr_dapo_register.py
|
| 13 |
+
- /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/0417_reward.py
|
| 14 |
+
- --model
|
| 15 |
+
- /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/qwen3-asr-merged
|
| 16 |
+
- --model_type
|
| 17 |
+
- my_qwen3_asr_rl
|
| 18 |
+
- --template
|
| 19 |
+
- my_qwen3_asr_rl
|
| 20 |
+
- --dataset
|
| 21 |
+
- /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/lora_0323_10w+55w+error+syn_with_domain_train90_targeted_rl_train90_loramerged_basewer_3suppress_server.jsonl
|
| 22 |
+
- --val_dataset
|
| 23 |
+
- /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/lora_0323_10w+55w+error+syn_with_domain_train90_targeted_rl_val5_sample5p_server.jsonl
|
| 24 |
+
- --reward_funcs
|
| 25 |
+
- asr_wer_sub_len_cmp_hallu_dirty_v56
|
| 26 |
+
- --train_type
|
| 27 |
+
- lora
|
| 28 |
+
- --use_vllm
|
| 29 |
+
- "false"
|
| 30 |
+
- --log_completions
|
| 31 |
+
- "true"
|
| 32 |
+
- --loss_type
|
| 33 |
+
- dapo
|
| 34 |
+
- --advantage_estimator
|
| 35 |
+
- grpo
|
| 36 |
+
- --scale_rewards
|
| 37 |
+
- group
|
| 38 |
+
- --num_iterations
|
| 39 |
+
- "2"
|
| 40 |
+
- --beta
|
| 41 |
+
- "0.04"
|
| 42 |
+
- --epsilon_high
|
| 43 |
+
- "0.28"
|
| 44 |
+
- --dynamic_sample
|
| 45 |
+
- "true"
|
| 46 |
+
- --max_resample_times
|
| 47 |
+
- "4"
|
| 48 |
+
- --overlong_filter
|
| 49 |
+
- "true"
|
| 50 |
+
- --truncation_strategy
|
| 51 |
+
- delete
|
| 52 |
+
- --num_generations
|
| 53 |
+
- "12"
|
| 54 |
+
- --generation_batch_size
|
| 55 |
+
- "48"
|
| 56 |
+
- --per_device_train_batch_size
|
| 57 |
+
- "8"
|
| 58 |
+
- --per_device_eval_batch_size
|
| 59 |
+
- "8"
|
| 60 |
+
- --gradient_accumulation_steps
|
| 61 |
+
- "12"
|
| 62 |
+
- --num_generations_eval
|
| 63 |
+
- "4"
|
| 64 |
+
- --max_completion_length
|
| 65 |
+
- "256"
|
| 66 |
+
- --temperature
|
| 67 |
+
- "0.50"
|
| 68 |
+
- --top_p
|
| 69 |
+
- "0.95"
|
| 70 |
+
- --top_k
|
| 71 |
+
- "50"
|
| 72 |
+
- --repetition_penalty
|
| 73 |
+
- "1.08"
|
| 74 |
+
- --learning_rate
|
| 75 |
+
- "5e-5"
|
| 76 |
+
- --lr_scheduler_type
|
| 77 |
+
- cosine
|
| 78 |
+
- --warmup_ratio
|
| 79 |
+
- "0.03"
|
| 80 |
+
- --report_to
|
| 81 |
+
- wandb
|
| 82 |
+
- --run_name
|
| 83 |
+
- qwen3asr_dapo_reward56_4x4x12_12gen_4GPU
|
| 84 |
+
- --output_dir
|
| 85 |
+
- /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/out/qwen3asr_dapo_reward56_4x4x12_12gen_4GPU
|
| 86 |
+
- --save_strategy
|
| 87 |
+
- steps
|
| 88 |
+
- --save_steps
|
| 89 |
+
- "20"
|
| 90 |
+
- --logging_steps
|
| 91 |
+
- "5"
|
| 92 |
+
- --freeze_llm
|
| 93 |
+
- "false"
|
| 94 |
+
- --freeze_vit
|
| 95 |
+
- "false"
|
| 96 |
+
- --freeze_aligner
|
| 97 |
+
- "false"
|
| 98 |
+
- --remove_unused_columns
|
| 99 |
+
- "false"
|
| 100 |
+
- --padding_side
|
| 101 |
+
- left
|
| 102 |
+
cpu_count: 64
|
| 103 |
+
cpu_count_logical: 128
|
| 104 |
+
cudaVersion: "12.4"
|
| 105 |
+
disk:
|
| 106 |
+
/:
|
| 107 |
+
total: "524945911808"
|
| 108 |
+
used: "105544630272"
|
| 109 |
+
email: pang_kaiyu@163.com
|
| 110 |
+
executable: /mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/bin/python3.10
|
| 111 |
+
gpu: NVIDIA A100-SXM4-80GB
|
| 112 |
+
gpu_count: 8
|
| 113 |
+
gpu_nvidia:
|
| 114 |
+
- architecture: Ampere
|
| 115 |
+
cudaCores: 6912
|
| 116 |
+
memoryTotal: "85899345920"
|
| 117 |
+
name: NVIDIA A100-SXM4-80GB
|
| 118 |
+
uuid: GPU-51466de9-a668-3c7e-bb90-bb8c112e0fea
|
| 119 |
+
- architecture: Ampere
|
| 120 |
+
cudaCores: 6912
|
| 121 |
+
memoryTotal: "85899345920"
|
| 122 |
+
name: NVIDIA A100-SXM4-80GB
|
| 123 |
+
uuid: GPU-ec1a5f87-66dd-26c2-5656-b57c7015a595
|
| 124 |
+
- architecture: Ampere
|
| 125 |
+
cudaCores: 6912
|
| 126 |
+
memoryTotal: "85899345920"
|
| 127 |
+
name: NVIDIA A100-SXM4-80GB
|
| 128 |
+
uuid: GPU-2dabb104-8ec6-09ec-017a-204779e18c19
|
| 129 |
+
- architecture: Ampere
|
| 130 |
+
cudaCores: 6912
|
| 131 |
+
memoryTotal: "85899345920"
|
| 132 |
+
name: NVIDIA A100-SXM4-80GB
|
| 133 |
+
uuid: GPU-0e67540a-1930-f39b-320f-0a6bfe1da2e0
|
| 134 |
+
- architecture: Ampere
|
| 135 |
+
cudaCores: 6912
|
| 136 |
+
memoryTotal: "85899345920"
|
| 137 |
+
name: NVIDIA A100-SXM4-80GB
|
| 138 |
+
uuid: GPU-b46e583c-5ac8-e350-6045-49ad7b17c092
|
| 139 |
+
- architecture: Ampere
|
| 140 |
+
cudaCores: 6912
|
| 141 |
+
memoryTotal: "85899345920"
|
| 142 |
+
name: NVIDIA A100-SXM4-80GB
|
| 143 |
+
uuid: GPU-f293d16a-41a0-fbc1-e86c-4f9682cb5e2b
|
| 144 |
+
- architecture: Ampere
|
| 145 |
+
cudaCores: 6912
|
| 146 |
+
memoryTotal: "85899345920"
|
| 147 |
+
name: NVIDIA A100-SXM4-80GB
|
| 148 |
+
uuid: GPU-67958330-9199-dca8-5c2e-c665b13b3452
|
| 149 |
+
- architecture: Ampere
|
| 150 |
+
cudaCores: 6912
|
| 151 |
+
memoryTotal: "85899345920"
|
| 152 |
+
name: NVIDIA A100-SXM4-80GB
|
| 153 |
+
uuid: GPU-6b56602f-4dcf-cb9d-4e98-04bf6254b789
|
| 154 |
+
host: SH-IDC1-10-140-37-1
|
| 155 |
+
memory:
|
| 156 |
+
total: "1081627828224"
|
| 157 |
+
os: Linux-3.10.0-957.el7.x86_64-x86_64-with-glibc2.17
|
| 158 |
+
program: /mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/cli/rlhf.py
|
| 159 |
+
python: CPython 3.10.18
|
| 160 |
+
root: /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload
|
| 161 |
+
slurm:
|
| 162 |
+
cluster_name: cluster_sproject3
|
| 163 |
+
conf: /etc/slurm/slurm.conf
|
| 164 |
+
cpus_on_node: "2"
|
| 165 |
+
gtids: "0"
|
| 166 |
+
job_account: research
|
| 167 |
+
job_cpus_per_node: "2"
|
| 168 |
+
job_gid: "800000689"
|
| 169 |
+
job_id: "8568802"
|
| 170 |
+
job_name: qwen_debug
|
| 171 |
+
job_nodelist: SH-IDC1-10-140-37-1
|
| 172 |
+
job_num_nodes: "1"
|
| 173 |
+
job_partition: interntmp
|
| 174 |
+
job_qos: normal
|
| 175 |
+
job_uid: "800000689"
|
| 176 |
+
job_user: panjiabao
|
| 177 |
+
jobid: "8568802"
|
| 178 |
+
launch_node_ipaddr: 10.140.37.164
|
| 179 |
+
localid: "0"
|
| 180 |
+
nnodes: "1"
|
| 181 |
+
nodeid: "0"
|
| 182 |
+
nodelist: SH-IDC1-10-140-37-1
|
| 183 |
+
nprocs: "1"
|
| 184 |
+
ntasks: "1"
|
| 185 |
+
prio_process: "0"
|
| 186 |
+
procid: "0"
|
| 187 |
+
srun_comm_host: 10.140.37.164
|
| 188 |
+
srun_comm_port: "44570"
|
| 189 |
+
step_gpus: 4,5
|
| 190 |
+
step_id: "0"
|
| 191 |
+
step_launcher_port: "44570"
|
| 192 |
+
step_nodelist: SH-IDC1-10-140-37-1
|
| 193 |
+
step_num_nodes: "1"
|
| 194 |
+
step_num_tasks: "1"
|
| 195 |
+
step_tasks_per_node: "1"
|
| 196 |
+
stepid: "0"
|
| 197 |
+
submit_dir: /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload
|
| 198 |
+
submit_host: SH-IDC1-10-140-37-164
|
| 199 |
+
task_pid: "24357"
|
| 200 |
+
tasks_per_node: "1"
|
| 201 |
+
topology_addr: SH-IDC1-10-140-37-1
|
| 202 |
+
topology_addr_pattern: node
|
| 203 |
+
umask: "0002"
|
| 204 |
+
working_cluster: cluster_sproject3:SH-IDC1-10-140-37-161:6817:9216:109
|
| 205 |
+
startedAt: "2026-04-17T04:32:37.414555Z"
|
| 206 |
+
writerId: bpic2cpmtxvnwca2pu2tg19g1j2qwpb2
|
| 207 |
+
m:
|
| 208 |
+
- "1": train/global_step
|
| 209 |
+
"6":
|
| 210 |
+
- 3
|
| 211 |
+
"7": []
|
| 212 |
+
- "2": '*'
|
| 213 |
+
"5": 1
|
| 214 |
+
"6":
|
| 215 |
+
- 1
|
| 216 |
+
"7": []
|
| 217 |
+
python_version: 3.10.18
|
| 218 |
+
t:
|
| 219 |
+
"1":
|
| 220 |
+
- 1
|
| 221 |
+
- 5
|
| 222 |
+
- 11
|
| 223 |
+
- 30
|
| 224 |
+
- 41
|
| 225 |
+
- 49
|
| 226 |
+
- 51
|
| 227 |
+
- 53
|
| 228 |
+
- 71
|
| 229 |
+
- 84
|
| 230 |
+
- 95
|
| 231 |
+
- 98
|
| 232 |
+
- 105
|
| 233 |
+
"2":
|
| 234 |
+
- 1
|
| 235 |
+
- 5
|
| 236 |
+
- 11
|
| 237 |
+
- 30
|
| 238 |
+
- 41
|
| 239 |
+
- 49
|
| 240 |
+
- 51
|
| 241 |
+
- 53
|
| 242 |
+
- 71
|
| 243 |
+
- 84
|
| 244 |
+
- 95
|
| 245 |
+
- 98
|
| 246 |
+
- 105
|
| 247 |
+
"3":
|
| 248 |
+
- 7
|
| 249 |
+
- 13
|
| 250 |
+
- 19
|
| 251 |
+
- 66
|
| 252 |
+
"4": 3.10.18
|
| 253 |
+
"5": 0.23.0
|
| 254 |
+
"6": 4.57.6
|
| 255 |
+
"9":
|
| 256 |
+
"1": transformers_trainer
|
| 257 |
+
"12": 0.23.0
|
| 258 |
+
"13": linux-x86_64
|
| 259 |
+
acc_strategy:
|
| 260 |
+
value: token
|
| 261 |
+
accelerator_config:
|
| 262 |
+
value:
|
| 263 |
+
dispatch_batches: false
|
| 264 |
+
even_batches: true
|
| 265 |
+
gradient_accumulation_kwargs: null
|
| 266 |
+
non_blocking: false
|
| 267 |
+
split_batches: false
|
| 268 |
+
use_seedable_sampler: true
|
| 269 |
+
adafactor:
|
| 270 |
+
value: false
|
| 271 |
+
adam_beta1:
|
| 272 |
+
value: 0.9
|
| 273 |
+
adam_beta2:
|
| 274 |
+
value: 0.95
|
| 275 |
+
adam_epsilon:
|
| 276 |
+
value: 1e-08
|
| 277 |
+
add_cross_attention:
|
| 278 |
+
value: false
|
| 279 |
+
advantage_estimator:
|
| 280 |
+
value: grpo
|
| 281 |
+
aligner_lr:
|
| 282 |
+
value: null
|
| 283 |
+
architectures:
|
| 284 |
+
value:
|
| 285 |
+
- Qwen3ASRForConditionalGeneration
|
| 286 |
+
async_generate:
|
| 287 |
+
value: false
|
| 288 |
+
auto_find_batch_size:
|
| 289 |
+
value: false
|
| 290 |
+
average_tokens_across_devices:
|
| 291 |
+
value: true
|
| 292 |
+
bad_words_ids:
|
| 293 |
+
value: null
|
| 294 |
+
batch_eval_metrics:
|
| 295 |
+
value: false
|
| 296 |
+
begin_suppress_tokens:
|
| 297 |
+
value: null
|
| 298 |
+
beta:
|
| 299 |
+
value: 0.04
|
| 300 |
+
bf16:
|
| 301 |
+
value: true
|
| 302 |
+
bf16_full_eval:
|
| 303 |
+
value: false
|
| 304 |
+
bos_token_id:
|
| 305 |
+
value: null
|
| 306 |
+
cache_implementation:
|
| 307 |
+
value: null
|
| 308 |
+
callbacks:
|
| 309 |
+
value: []
|
| 310 |
+
cast_lm_head_to_fp32:
|
| 311 |
+
value: false
|
| 312 |
+
chat_template_kwargs:
|
| 313 |
+
value: null
|
| 314 |
+
check_model:
|
| 315 |
+
value: true
|
| 316 |
+
chord_enable_phi_function:
|
| 317 |
+
value: false
|
| 318 |
+
chord_mu_decay_steps:
|
| 319 |
+
value: null
|
| 320 |
+
chord_mu_peak:
|
| 321 |
+
value: null
|
| 322 |
+
chord_mu_valley:
|
| 323 |
+
value: null
|
| 324 |
+
chord_mu_warmup_steps:
|
| 325 |
+
value: null
|
| 326 |
+
chord_sft_dataset:
|
| 327 |
+
value: []
|
| 328 |
+
chord_sft_per_device_train_batch_size:
|
| 329 |
+
value: null
|
| 330 |
+
chunk_size_feed_forward:
|
| 331 |
+
value: 0
|
| 332 |
+
completion_length_limit_scope:
|
| 333 |
+
value: per_round
|
| 334 |
+
cosine_max_len:
|
| 335 |
+
value: 256
|
| 336 |
+
cosine_max_len_value_correct:
|
| 337 |
+
value: 0.5
|
| 338 |
+
cosine_max_len_value_wrong:
|
| 339 |
+
value: 0
|
| 340 |
+
cosine_min_len_value_correct:
|
| 341 |
+
value: 1
|
| 342 |
+
cosine_min_len_value_wrong:
|
| 343 |
+
value: -0.5
|
| 344 |
+
cross_attention_hidden_size:
|
| 345 |
+
value: null
|
| 346 |
+
data_seed:
|
| 347 |
+
value: 42
|
| 348 |
+
dataloader_drop_last:
|
| 349 |
+
value: true
|
| 350 |
+
dataloader_num_workers:
|
| 351 |
+
value: 1
|
| 352 |
+
dataloader_persistent_workers:
|
| 353 |
+
value: false
|
| 354 |
+
dataloader_pin_memory:
|
| 355 |
+
value: true
|
| 356 |
+
dataloader_prefetch_factor:
|
| 357 |
+
value: 2
|
| 358 |
+
dataset_shuffle:
|
| 359 |
+
value: true
|
| 360 |
+
ddp_backend:
|
| 361 |
+
value: null
|
| 362 |
+
ddp_broadcast_buffers:
|
| 363 |
+
value: null
|
| 364 |
+
ddp_bucket_cap_mb:
|
| 365 |
+
value: null
|
| 366 |
+
ddp_find_unused_parameters:
|
| 367 |
+
value: null
|
| 368 |
+
ddp_timeout:
|
| 369 |
+
value: 18000000
|
| 370 |
+
debug:
|
| 371 |
+
value: []
|
| 372 |
+
decoder_start_token_id:
|
| 373 |
+
value: null
|
| 374 |
+
deepspeed:
|
| 375 |
+
value: null
|
| 376 |
+
delta:
|
| 377 |
+
value: null
|
| 378 |
+
disable_dropout:
|
| 379 |
+
value: false
|
| 380 |
+
disable_tqdm:
|
| 381 |
+
value: false
|
| 382 |
+
diversity_penalty:
|
| 383 |
+
value: 0
|
| 384 |
+
do_eval:
|
| 385 |
+
value: true
|
| 386 |
+
do_predict:
|
| 387 |
+
value: false
|
| 388 |
+
do_sample:
|
| 389 |
+
value: false
|
| 390 |
+
do_train:
|
| 391 |
+
value: false
|
| 392 |
+
ds3_gather_for_generation:
|
| 393 |
+
value: true
|
| 394 |
+
dtype:
|
| 395 |
+
value: bfloat16
|
| 396 |
+
dynamic_sample:
|
| 397 |
+
value: true
|
| 398 |
+
early_stop_interval:
|
| 399 |
+
value: null
|
| 400 |
+
early_stopping:
|
| 401 |
+
value: false
|
| 402 |
+
enable_channel_loss:
|
| 403 |
+
value: false
|
| 404 |
+
enable_dft_loss:
|
| 405 |
+
value: false
|
| 406 |
+
enable_flattened_weight_sync:
|
| 407 |
+
value: true
|
| 408 |
+
encoder_no_repeat_ngram_size:
|
| 409 |
+
value: 0
|
| 410 |
+
eos_token_id:
|
| 411 |
+
value: 151645
|
| 412 |
+
epsilon:
|
| 413 |
+
value: 0.2
|
| 414 |
+
epsilon_high:
|
| 415 |
+
value: 0.28
|
| 416 |
+
eval_accumulation_steps:
|
| 417 |
+
value: null
|
| 418 |
+
eval_dataset:
|
| 419 |
+
value: []
|
| 420 |
+
eval_dataset_args:
|
| 421 |
+
value: null
|
| 422 |
+
eval_delay:
|
| 423 |
+
value: 0
|
| 424 |
+
eval_do_concat_batches:
|
| 425 |
+
value: true
|
| 426 |
+
eval_generation_config:
|
| 427 |
+
value: null
|
| 428 |
+
eval_limit:
|
| 429 |
+
value: null
|
| 430 |
+
eval_metric:
|
| 431 |
+
value: null
|
| 432 |
+
eval_on_start:
|
| 433 |
+
value: false
|
| 434 |
+
eval_steps:
|
| 435 |
+
value: 20
|
| 436 |
+
eval_strategy:
|
| 437 |
+
value: steps
|
| 438 |
+
eval_use_evalscope:
|
| 439 |
+
value: false
|
| 440 |
+
eval_use_gather_object:
|
| 441 |
+
value: false
|
| 442 |
+
exponential_decay_length_penalty:
|
| 443 |
+
value: null
|
| 444 |
+
extra_eval_args:
|
| 445 |
+
value: null
|
| 446 |
+
finetuning_task:
|
| 447 |
+
value: null
|
| 448 |
+
forced_bos_token_id:
|
| 449 |
+
value: null
|
| 450 |
+
forced_eos_token_id:
|
| 451 |
+
value: null
|
| 452 |
+
fp16:
|
| 453 |
+
value: false
|
| 454 |
+
fp16_backend:
|
| 455 |
+
value: auto
|
| 456 |
+
fp16_full_eval:
|
| 457 |
+
value: false
|
| 458 |
+
fp16_opt_level:
|
| 459 |
+
value: O1
|
| 460 |
+
fsdp:
|
| 461 |
+
value: []
|
| 462 |
+
fsdp_config:
|
| 463 |
+
value:
|
| 464 |
+
min_num_params: 0
|
| 465 |
+
xla: false
|
| 466 |
+
xla_fsdp_grad_ckpt: false
|
| 467 |
+
xla_fsdp_v2: false
|
| 468 |
+
fsdp_min_num_params:
|
| 469 |
+
value: 0
|
| 470 |
+
fsdp_transformer_layer_cls_to_wrap:
|
| 471 |
+
value: null
|
| 472 |
+
full_determinism:
|
| 473 |
+
value: false
|
| 474 |
+
galore_cos_threshold:
|
| 475 |
+
value: 0.4
|
| 476 |
+
galore_gamma_proj:
|
| 477 |
+
value: 2
|
| 478 |
+
galore_optim_per_parameter:
|
| 479 |
+
value: false
|
| 480 |
+
galore_proj_bits:
|
| 481 |
+
value: 4
|
| 482 |
+
galore_proj_group_size:
|
| 483 |
+
value: 256
|
| 484 |
+
galore_proj_quant:
|
| 485 |
+
value: false
|
| 486 |
+
galore_proj_type:
|
| 487 |
+
value: std
|
| 488 |
+
galore_quantization:
|
| 489 |
+
value: false
|
| 490 |
+
galore_queue_size:
|
| 491 |
+
value: 5
|
| 492 |
+
galore_rank:
|
| 493 |
+
value: 128
|
| 494 |
+
galore_scale:
|
| 495 |
+
value: 1
|
| 496 |
+
galore_target_modules:
|
| 497 |
+
value: null
|
| 498 |
+
galore_update_proj_gap:
|
| 499 |
+
value: 50
|
| 500 |
+
galore_with_embedding:
|
| 501 |
+
value: false
|
| 502 |
+
generation_batch_size:
|
| 503 |
+
value: 48
|
| 504 |
+
generation_kwargs:
|
| 505 |
+
value: null
|
| 506 |
+
gradient_accumulation_steps:
|
| 507 |
+
value: 12
|
| 508 |
+
gradient_checkpointing:
|
| 509 |
+
value: false
|
| 510 |
+
gradient_checkpointing_kwargs:
|
| 511 |
+
value: null
|
| 512 |
+
greater_is_better:
|
| 513 |
+
value: false
|
| 514 |
+
group_by_length:
|
| 515 |
+
value: false
|
| 516 |
+
half_precision_backend:
|
| 517 |
+
value: auto
|
| 518 |
+
hub_always_push:
|
| 519 |
+
value: false
|
| 520 |
+
hub_model_id:
|
| 521 |
+
value: null
|
| 522 |
+
hub_private_repo:
|
| 523 |
+
value: null
|
| 524 |
+
hub_revision:
|
| 525 |
+
value: null
|
| 526 |
+
hub_strategy:
|
| 527 |
+
value: every_save
|
| 528 |
+
hub_token:
|
| 529 |
+
value: <HUB_TOKEN>
|
| 530 |
+
id2label:
|
| 531 |
+
value:
|
| 532 |
+
"0": LABEL_0
|
| 533 |
+
"1": LABEL_1
|
| 534 |
+
ignore_data_skip:
|
| 535 |
+
value: false
|
| 536 |
+
importance_sampling_level:
|
| 537 |
+
value: token
|
| 538 |
+
include_for_metrics:
|
| 539 |
+
value: []
|
| 540 |
+
include_inputs_for_metrics:
|
| 541 |
+
value: false
|
| 542 |
+
include_num_input_tokens_seen:
|
| 543 |
+
value: "no"
|
| 544 |
+
include_tokens_per_second:
|
| 545 |
+
value: false
|
| 546 |
+
is_decoder:
|
| 547 |
+
value: false
|
| 548 |
+
is_encoder_decoder:
|
| 549 |
+
value: false
|
| 550 |
+
jit_mode_eval:
|
| 551 |
+
value: false
|
| 552 |
+
kl_in_reward:
|
| 553 |
+
value: false
|
| 554 |
+
label_names:
|
| 555 |
+
value: null
|
| 556 |
+
label_smoothing_factor:
|
| 557 |
+
value: 0
|
| 558 |
+
label2id:
|
| 559 |
+
value:
|
| 560 |
+
LABEL_0: 0
|
| 561 |
+
LABEL_1: 1
|
| 562 |
+
learning_rate:
|
| 563 |
+
value: 5e-05
|
| 564 |
+
length_column_name:
|
| 565 |
+
value: length
|
| 566 |
+
length_penalty:
|
| 567 |
+
value: 1
|
| 568 |
+
liger_kernel_config:
|
| 569 |
+
value: null
|
| 570 |
+
lisa_activated_layers:
|
| 571 |
+
value: 0
|
| 572 |
+
lisa_step_interval:
|
| 573 |
+
value: 20
|
| 574 |
+
load_best_model_at_end:
|
| 575 |
+
value: false
|
| 576 |
+
local_rank:
|
| 577 |
+
value: 0
|
| 578 |
+
log_completions:
|
| 579 |
+
value: true
|
| 580 |
+
log_completions_hub_repo:
|
| 581 |
+
value: null
|
| 582 |
+
log_entropy:
|
| 583 |
+
value: false
|
| 584 |
+
log_level:
|
| 585 |
+
value: passive
|
| 586 |
+
log_level_replica:
|
| 587 |
+
value: warning
|
| 588 |
+
log_on_each_node:
|
| 589 |
+
value: true
|
| 590 |
+
log_rollout_offpolicy_metrics:
|
| 591 |
+
value: false
|
| 592 |
+
log_unique_prompts:
|
| 593 |
+
value: false
|
| 594 |
+
logging_dir:
|
| 595 |
+
value: /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/out/qwen3asr_dapo_reward56_4x4x12_12gen_4GPU/v3-20260417-123227/runs
|
| 596 |
+
logging_first_step:
|
| 597 |
+
value: true
|
| 598 |
+
logging_nan_inf_filter:
|
| 599 |
+
value: true
|
| 600 |
+
logging_steps:
|
| 601 |
+
value: 5
|
| 602 |
+
logging_strategy:
|
| 603 |
+
value: steps
|
| 604 |
+
lora_rank:
|
| 605 |
+
value: 8
|
| 606 |
+
loss_type:
|
| 607 |
+
value: dapo
|
| 608 |
+
lr_scheduler_kwargs:
|
| 609 |
+
value: null
|
| 610 |
+
lr_scheduler_type:
|
| 611 |
+
value: cosine
|
| 612 |
+
mask_truncated_completions:
|
| 613 |
+
value: false
|
| 614 |
+
max_completion_length:
|
| 615 |
+
value: 256
|
| 616 |
+
max_epochs:
|
| 617 |
+
value: null
|
| 618 |
+
max_grad_norm:
|
| 619 |
+
value: 1
|
| 620 |
+
max_length:
|
| 621 |
+
value: 20
|
| 622 |
+
max_resample_times:
|
| 623 |
+
value: 4
|
| 624 |
+
max_shard_size:
|
| 625 |
+
value: 5GB
|
| 626 |
+
max_steps:
|
| 627 |
+
value: -1
|
| 628 |
+
max_tool_calling_iterations:
|
| 629 |
+
value: null
|
| 630 |
+
max_turns:
|
| 631 |
+
value: null
|
| 632 |
+
metric_for_best_model:
|
| 633 |
+
value: loss
|
| 634 |
+
min_length:
|
| 635 |
+
value: 0
|
| 636 |
+
min_p:
|
| 637 |
+
value: null
|
| 638 |
+
model/num_parameters:
|
| 639 |
+
value: 2050307712
|
| 640 |
+
model_init_kwargs:
|
| 641 |
+
value: null
|
| 642 |
+
model_type:
|
| 643 |
+
value: qwen3_asr
|
| 644 |
+
move_model_batches:
|
| 645 |
+
value: null
|
| 646 |
+
mp_parameters:
|
| 647 |
+
value: ""
|
| 648 |
+
multi_objective_aggregation:
|
| 649 |
+
value: sum_then_normalize
|
| 650 |
+
multi_turn_scheduler:
|
| 651 |
+
value: null
|
| 652 |
+
neftune_noise_alpha:
|
| 653 |
+
value: null
|
| 654 |
+
no_cuda:
|
| 655 |
+
value: false
|
| 656 |
+
no_repeat_ngram_size:
|
| 657 |
+
value: 0
|
| 658 |
+
num_beam_groups:
|
| 659 |
+
value: 1
|
| 660 |
+
num_beams:
|
| 661 |
+
value: 1
|
| 662 |
+
num_completions_to_print:
|
| 663 |
+
value: null
|
| 664 |
+
num_generations:
|
| 665 |
+
value: 12
|
| 666 |
+
num_generations_eval:
|
| 667 |
+
value: 4
|
| 668 |
+
num_iterations:
|
| 669 |
+
value: 2
|
| 670 |
+
num_return_sequences:
|
| 671 |
+
value: 1
|
| 672 |
+
num_train_epochs:
|
| 673 |
+
value: 3
|
| 674 |
+
off_policy_mask_threshold:
|
| 675 |
+
value: null
|
| 676 |
+
off_policy_sequence_mask_delta:
|
| 677 |
+
value: null
|
| 678 |
+
offload_model:
|
| 679 |
+
value: false
|
| 680 |
+
offload_optimizer:
|
| 681 |
+
value: false
|
| 682 |
+
optim:
|
| 683 |
+
value: adamw_torch
|
| 684 |
+
optim_args:
|
| 685 |
+
value: null
|
| 686 |
+
optim_target_modules:
|
| 687 |
+
value: null
|
| 688 |
+
optimizer:
|
| 689 |
+
value: null
|
| 690 |
+
output_attentions:
|
| 691 |
+
value: false
|
| 692 |
+
output_dir:
|
| 693 |
+
value: /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/out/qwen3asr_dapo_reward56_4x4x12_12gen_4GPU/v3-20260417-123227
|
| 694 |
+
output_hidden_states:
|
| 695 |
+
value: false
|
| 696 |
+
output_scores:
|
| 697 |
+
value: false
|
| 698 |
+
overlong_filter:
|
| 699 |
+
value: true
|
| 700 |
+
overwrite_output_dir:
|
| 701 |
+
value: false
|
| 702 |
+
pad_token_id:
|
| 703 |
+
value: 151643
|
| 704 |
+
parallelism_config:
|
| 705 |
+
value: null
|
| 706 |
+
past_index:
|
| 707 |
+
value: -1
|
| 708 |
+
peft_config:
|
| 709 |
+
value:
|
| 710 |
+
default:
|
| 711 |
+
alora_invocation_tokens: null
|
| 712 |
+
arrow_config: null
|
| 713 |
+
auto_mapping: null
|
| 714 |
+
base_model_name_or_path: /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/qwen3-asr-merged
|
| 715 |
+
bias: none
|
| 716 |
+
corda_config: null
|
| 717 |
+
ensure_weight_tying: false
|
| 718 |
+
eva_config: null
|
| 719 |
+
exclude_modules: null
|
| 720 |
+
fan_in_fan_out: false
|
| 721 |
+
inference_mode: false
|
| 722 |
+
init_lora_weights: true
|
| 723 |
+
layer_replication: null
|
| 724 |
+
layers_pattern: null
|
| 725 |
+
layers_to_transform: null
|
| 726 |
+
lora_alpha: 32
|
| 727 |
+
lora_bias: false
|
| 728 |
+
lora_dropout: 0.05
|
| 729 |
+
lora_dtype: null
|
| 730 |
+
lorap_emb_lr: 1e-06
|
| 731 |
+
lorap_lr_ratio: null
|
| 732 |
+
megatron_config: null
|
| 733 |
+
megatron_core: megatron.core
|
| 734 |
+
modules_to_save: []
|
| 735 |
+
peft_type: LORA
|
| 736 |
+
peft_version: 0.18.1
|
| 737 |
+
qalora_group_size: 16
|
| 738 |
+
r: 8
|
| 739 |
+
revision: null
|
| 740 |
+
runtime_config:
|
| 741 |
+
ephemeral_gpu_offload: false
|
| 742 |
+
target_modules: ^(thinker\.model(?=\.).*\.(up_proj|v_proj|k_proj|o_proj|q_proj|gate_proj|down_proj)|thinker\.audio_tower\.layers(?=\.).*\.(v_proj|fc2|k_proj|fc1|q_proj|out_proj)|thinker\.audio_tower\.conv_out(?=\.)|thinker\.audio_tower\.proj1(?=\.)|thinker\.audio_tower\.proj2(?=\.))$
|
| 743 |
+
target_parameters: null
|
| 744 |
+
task_type: CAUSAL_LM
|
| 745 |
+
trainable_token_indices: null
|
| 746 |
+
use_dora: false
|
| 747 |
+
use_qalora: false
|
| 748 |
+
use_rslora: false
|
| 749 |
+
per_device_eval_batch_size:
|
| 750 |
+
value: 8
|
| 751 |
+
per_device_train_batch_size:
|
| 752 |
+
value: 8
|
| 753 |
+
per_gpu_eval_batch_size:
|
| 754 |
+
value: null
|
| 755 |
+
per_gpu_train_batch_size:
|
| 756 |
+
value: null
|
| 757 |
+
prediction_loss_only:
|
| 758 |
+
value: false
|
| 759 |
+
prefix:
|
| 760 |
+
value: null
|
| 761 |
+
problem_type:
|
| 762 |
+
value: null
|
| 763 |
+
project:
|
| 764 |
+
value: huggingface
|
| 765 |
+
push_to_hub:
|
| 766 |
+
value: false
|
| 767 |
+
push_to_hub_model_id:
|
| 768 |
+
value: null
|
| 769 |
+
push_to_hub_organization:
|
| 770 |
+
value: null
|
| 771 |
+
push_to_hub_token:
|
| 772 |
+
value: <PUSH_TO_HUB_TOKEN>
|
| 773 |
+
ray_scope:
|
| 774 |
+
value: last
|
| 775 |
+
ref_model_mixup_alpha:
|
| 776 |
+
value: 0.6
|
| 777 |
+
ref_model_sync_steps:
|
| 778 |
+
value: 512
|
| 779 |
+
remove_invalid_values:
|
| 780 |
+
value: false
|
| 781 |
+
remove_unused_columns:
|
| 782 |
+
value: false
|
| 783 |
+
repetition_max_penalty:
|
| 784 |
+
value: -1
|
| 785 |
+
repetition_n_grams:
|
| 786 |
+
value: 3
|
| 787 |
+
repetition_penalty:
|
| 788 |
+
value: 1.08
|
| 789 |
+
report_to:
|
| 790 |
+
value:
|
| 791 |
+
- wandb
|
| 792 |
+
restore_callback_states_from_checkpoint:
|
| 793 |
+
value: false
|
| 794 |
+
resume_from_checkpoint:
|
| 795 |
+
value: null
|
| 796 |
+
resume_only_model:
|
| 797 |
+
value: false
|
| 798 |
+
return_dict:
|
| 799 |
+
value: true
|
| 800 |
+
return_dict_in_generate:
|
| 801 |
+
value: false
|
| 802 |
+
reward_model:
|
| 803 |
+
value: null
|
| 804 |
+
reward_model_plugin:
|
| 805 |
+
value: null
|
| 806 |
+
reward_weights:
|
| 807 |
+
value: null
|
| 808 |
+
rollout_importance_sampling_mode:
|
| 809 |
+
value: null
|
| 810 |
+
rollout_importance_sampling_threshold:
|
| 811 |
+
value: 2
|
| 812 |
+
router_aux_loss_coef:
|
| 813 |
+
value: 0
|
| 814 |
+
run_name:
|
| 815 |
+
value: qwen3asr_dapo_reward56_4x4x12_12gen_4GPU
|
| 816 |
+
safe_serialization:
|
| 817 |
+
value: true
|
| 818 |
+
sapo_temperature_neg:
|
| 819 |
+
value: 1.05
|
| 820 |
+
sapo_temperature_pos:
|
| 821 |
+
value: 1
|
| 822 |
+
save_on_each_node:
|
| 823 |
+
value: false
|
| 824 |
+
save_only_model:
|
| 825 |
+
value: false
|
| 826 |
+
save_safetensors:
|
| 827 |
+
value: true
|
| 828 |
+
save_steps:
|
| 829 |
+
value: 20
|
| 830 |
+
save_strategy:
|
| 831 |
+
value: steps
|
| 832 |
+
save_total_limit:
|
| 833 |
+
value: null
|
| 834 |
+
scale_rewards:
|
| 835 |
+
value: group
|
| 836 |
+
seed:
|
| 837 |
+
value: 42
|
| 838 |
+
sep_token_id:
|
| 839 |
+
value: null
|
| 840 |
+
shuffle_dataset:
|
| 841 |
+
value: true
|
| 842 |
+
skip_memory_metrics:
|
| 843 |
+
value: true
|
| 844 |
+
sleep_level:
|
| 845 |
+
value: 0
|
| 846 |
+
soft_cache_length:
|
| 847 |
+
value: null
|
| 848 |
+
soft_max_length:
|
| 849 |
+
value: null
|
| 850 |
+
steps_per_generation:
|
| 851 |
+
value: 3
|
| 852 |
+
stop_words:
|
| 853 |
+
value: []
|
| 854 |
+
structured_outputs_regex:
|
| 855 |
+
value: null
|
| 856 |
+
support_languages:
|
| 857 |
+
value:
|
| 858 |
+
- Chinese
|
| 859 |
+
- English
|
| 860 |
+
- Cantonese
|
| 861 |
+
- Arabic
|
| 862 |
+
- German
|
| 863 |
+
- French
|
| 864 |
+
- Spanish
|
| 865 |
+
- Portuguese
|
| 866 |
+
- Indonesian
|
| 867 |
+
- Italian
|
| 868 |
+
- Korean
|
| 869 |
+
- Russian
|
| 870 |
+
- Thai
|
| 871 |
+
- Vietnamese
|
| 872 |
+
- Japanese
|
| 873 |
+
- Turkish
|
| 874 |
+
- Hindi
|
| 875 |
+
- Malay
|
| 876 |
+
- Dutch
|
| 877 |
+
- Swedish
|
| 878 |
+
- Danish
|
| 879 |
+
- Finnish
|
| 880 |
+
- Polish
|
| 881 |
+
- Czech
|
| 882 |
+
- Filipino
|
| 883 |
+
- Persian
|
| 884 |
+
- Greek
|
| 885 |
+
- Romanian
|
| 886 |
+
- Hungarian
|
| 887 |
+
- Macedonian
|
| 888 |
+
suppress_tokens:
|
| 889 |
+
value: null
|
| 890 |
+
sync_ref_model:
|
| 891 |
+
value: false
|
| 892 |
+
task_specific_params:
|
| 893 |
+
value: null
|
| 894 |
+
tau_neg:
|
| 895 |
+
value: 1.05
|
| 896 |
+
tau_pos:
|
| 897 |
+
value: 1
|
| 898 |
+
temperature:
|
| 899 |
+
value: 0.5
|
| 900 |
+
tf_legacy_loss:
|
| 901 |
+
value: false
|
| 902 |
+
tf32:
|
| 903 |
+
value: null
|
| 904 |
+
thinker_config:
|
| 905 |
+
value:
|
| 906 |
+
_name_or_path: ""
|
| 907 |
+
add_cross_attention: false
|
| 908 |
+
architectures:
|
| 909 |
+
- Qwen3ASRForConditionalGeneration
|
| 910 |
+
audio_config:
|
| 911 |
+
_name_or_path: ""
|
| 912 |
+
activation_dropout: 0
|
| 913 |
+
activation_function: gelu
|
| 914 |
+
add_cross_attention: false
|
| 915 |
+
architectures: null
|
| 916 |
+
attention_dropout: 0
|
| 917 |
+
bad_words_ids: null
|
| 918 |
+
begin_suppress_tokens: null
|
| 919 |
+
bos_token_id: null
|
| 920 |
+
chunk_size_feed_forward: 0
|
| 921 |
+
conv_chunksize: 500
|
| 922 |
+
cross_attention_hidden_size: null
|
| 923 |
+
d_model: 1024
|
| 924 |
+
decoder_start_token_id: null
|
| 925 |
+
diversity_penalty: 0
|
| 926 |
+
do_sample: false
|
| 927 |
+
downsample_hidden_size: 480
|
| 928 |
+
dropout: 0
|
| 929 |
+
dtype: null
|
| 930 |
+
early_stopping: false
|
| 931 |
+
encoder_attention_heads: 16
|
| 932 |
+
encoder_ffn_dim: 4096
|
| 933 |
+
encoder_layers: 24
|
| 934 |
+
encoder_no_repeat_ngram_size: 0
|
| 935 |
+
eos_token_id: null
|
| 936 |
+
exponential_decay_length_penalty: null
|
| 937 |
+
finetuning_task: null
|
| 938 |
+
forced_bos_token_id: null
|
| 939 |
+
forced_eos_token_id: null
|
| 940 |
+
id2label:
|
| 941 |
+
"0": LABEL_0
|
| 942 |
+
"1": LABEL_1
|
| 943 |
+
initializer_range: 0.02
|
| 944 |
+
is_decoder: false
|
| 945 |
+
is_encoder_decoder: false
|
| 946 |
+
label2id:
|
| 947 |
+
LABEL_0: 0
|
| 948 |
+
LABEL_1: 1
|
| 949 |
+
length_penalty: 1
|
| 950 |
+
max_length: 20
|
| 951 |
+
max_source_positions: 1500
|
| 952 |
+
min_length: 0
|
| 953 |
+
model_type: qwen3_asr_audio_encoder
|
| 954 |
+
n_window: 50
|
| 955 |
+
n_window_infer: 800
|
| 956 |
+
no_repeat_ngram_size: 0
|
| 957 |
+
num_beam_groups: 1
|
| 958 |
+
num_beams: 1
|
| 959 |
+
num_hidden_layers: 24
|
| 960 |
+
num_mel_bins: 128
|
| 961 |
+
num_return_sequences: 1
|
| 962 |
+
output_attentions: false
|
| 963 |
+
output_dim: 2048
|
| 964 |
+
output_hidden_states: false
|
| 965 |
+
output_scores: false
|
| 966 |
+
pad_token_id: null
|
| 967 |
+
prefix: null
|
| 968 |
+
problem_type: null
|
| 969 |
+
remove_invalid_values: false
|
| 970 |
+
repetition_penalty: 1
|
| 971 |
+
return_dict: true
|
| 972 |
+
return_dict_in_generate: false
|
| 973 |
+
scale_embedding: false
|
| 974 |
+
sep_token_id: null
|
| 975 |
+
suppress_tokens: null
|
| 976 |
+
task_specific_params: null
|
| 977 |
+
temperature: 1
|
| 978 |
+
tf_legacy_loss: false
|
| 979 |
+
tie_encoder_decoder: false
|
| 980 |
+
tie_word_embeddings: true
|
| 981 |
+
tokenizer_class: null
|
| 982 |
+
top_k: 50
|
| 983 |
+
top_p: 1
|
| 984 |
+
torchscript: false
|
| 985 |
+
typical_p: 1
|
| 986 |
+
use_bfloat16: false
|
| 987 |
+
audio_end_token_id: 151670
|
| 988 |
+
audio_start_token_id: 151669
|
| 989 |
+
audio_token_id: 151676
|
| 990 |
+
bad_words_ids: null
|
| 991 |
+
begin_suppress_tokens: null
|
| 992 |
+
bos_token_id: null
|
| 993 |
+
chunk_size_feed_forward: 0
|
| 994 |
+
cross_attention_hidden_size: null
|
| 995 |
+
decoder_start_token_id: null
|
| 996 |
+
diversity_penalty: 0
|
| 997 |
+
do_sample: false
|
| 998 |
+
dtype: bfloat16
|
| 999 |
+
early_stopping: false
|
| 1000 |
+
encoder_no_repeat_ngram_size: 0
|
| 1001 |
+
eos_token_id: null
|
| 1002 |
+
exponential_decay_length_penalty: null
|
| 1003 |
+
finetuning_task: null
|
| 1004 |
+
forced_bos_token_id: null
|
| 1005 |
+
forced_eos_token_id: null
|
| 1006 |
+
id2label:
|
| 1007 |
+
"0": LABEL_0
|
| 1008 |
+
"1": LABEL_1
|
| 1009 |
+
initializer_range: 0.02
|
| 1010 |
+
is_decoder: false
|
| 1011 |
+
is_encoder_decoder: false
|
| 1012 |
+
label2id:
|
| 1013 |
+
LABEL_0: 0
|
| 1014 |
+
LABEL_1: 1
|
| 1015 |
+
length_penalty: 1
|
| 1016 |
+
max_length: 20
|
| 1017 |
+
min_length: 0
|
| 1018 |
+
model_type: qwen3_asr_thinker
|
| 1019 |
+
no_repeat_ngram_size: 0
|
| 1020 |
+
num_beam_groups: 1
|
| 1021 |
+
num_beams: 1
|
| 1022 |
+
num_return_sequences: 1
|
| 1023 |
+
output_attentions: false
|
| 1024 |
+
output_hidden_states: false
|
| 1025 |
+
output_scores: false
|
| 1026 |
+
pad_token_id: null
|
| 1027 |
+
prefix: null
|
| 1028 |
+
problem_type: null
|
| 1029 |
+
remove_invalid_values: false
|
| 1030 |
+
repetition_penalty: 1
|
| 1031 |
+
return_dict: true
|
| 1032 |
+
return_dict_in_generate: false
|
| 1033 |
+
sep_token_id: null
|
| 1034 |
+
suppress_tokens: null
|
| 1035 |
+
task_specific_params: null
|
| 1036 |
+
temperature: 1
|
| 1037 |
+
text_config:
|
| 1038 |
+
_name_or_path: ""
|
| 1039 |
+
add_cross_attention: false
|
| 1040 |
+
architectures: null
|
| 1041 |
+
attention_bias: false
|
| 1042 |
+
attention_dropout: 0
|
| 1043 |
+
bad_words_ids: null
|
| 1044 |
+
begin_suppress_tokens: null
|
| 1045 |
+
bos_token_id: null
|
| 1046 |
+
chunk_size_feed_forward: 0
|
| 1047 |
+
cross_attention_hidden_size: null
|
| 1048 |
+
decoder_start_token_id: null
|
| 1049 |
+
diversity_penalty: 0
|
| 1050 |
+
do_sample: false
|
| 1051 |
+
dtype: null
|
| 1052 |
+
early_stopping: false
|
| 1053 |
+
encoder_no_repeat_ngram_size: 0
|
| 1054 |
+
eos_token_id: null
|
| 1055 |
+
exponential_decay_length_penalty: null
|
| 1056 |
+
finetuning_task: null
|
| 1057 |
+
forced_bos_token_id: null
|
| 1058 |
+
forced_eos_token_id: null
|
| 1059 |
+
head_dim: 128
|
| 1060 |
+
hidden_act: silu
|
| 1061 |
+
hidden_size: 2048
|
| 1062 |
+
id2label:
|
| 1063 |
+
"0": LABEL_0
|
| 1064 |
+
"1": LABEL_1
|
| 1065 |
+
initializer_range: 0.02
|
| 1066 |
+
intermediate_size: 6144
|
| 1067 |
+
is_decoder: false
|
| 1068 |
+
is_encoder_decoder: false
|
| 1069 |
+
label2id:
|
| 1070 |
+
LABEL_0: 0
|
| 1071 |
+
LABEL_1: 1
|
| 1072 |
+
length_penalty: 1
|
| 1073 |
+
max_length: 20
|
| 1074 |
+
max_position_embeddings: 65536
|
| 1075 |
+
min_length: 0
|
| 1076 |
+
model_type: qwen3_asr_text
|
| 1077 |
+
no_repeat_ngram_size: 0
|
| 1078 |
+
num_attention_heads: 16
|
| 1079 |
+
num_beam_groups: 1
|
| 1080 |
+
num_beams: 1
|
| 1081 |
+
num_hidden_layers: 28
|
| 1082 |
+
num_key_value_heads: 8
|
| 1083 |
+
num_return_sequences: 1
|
| 1084 |
+
output_attentions: false
|
| 1085 |
+
output_hidden_states: false
|
| 1086 |
+
output_scores: false
|
| 1087 |
+
pad_token_id: 151643
|
| 1088 |
+
prefix: null
|
| 1089 |
+
problem_type: null
|
| 1090 |
+
remove_invalid_values: false
|
| 1091 |
+
repetition_penalty: 1
|
| 1092 |
+
return_dict: true
|
| 1093 |
+
return_dict_in_generate: false
|
| 1094 |
+
rms_norm_eps: 1e-06
|
| 1095 |
+
rope_scaling:
|
| 1096 |
+
interleaved: true
|
| 1097 |
+
mrope_interleaved: true
|
| 1098 |
+
mrope_section:
|
| 1099 |
+
- 24
|
| 1100 |
+
- 20
|
| 1101 |
+
- 20
|
| 1102 |
+
rope_type: default
|
| 1103 |
+
type: default
|
| 1104 |
+
rope_theta: 1000000
|
| 1105 |
+
sep_token_id: null
|
| 1106 |
+
suppress_tokens: null
|
| 1107 |
+
task_specific_params: null
|
| 1108 |
+
temperature: 1
|
| 1109 |
+
tf_legacy_loss: false
|
| 1110 |
+
tie_encoder_decoder: false
|
| 1111 |
+
tie_word_embeddings: true
|
| 1112 |
+
tokenizer_class: null
|
| 1113 |
+
top_k: 50
|
| 1114 |
+
top_p: 1
|
| 1115 |
+
torchscript: false
|
| 1116 |
+
typical_p: 1
|
| 1117 |
+
use_bfloat16: false
|
| 1118 |
+
use_cache: false
|
| 1119 |
+
vocab_size: 151936
|
| 1120 |
+
tf_legacy_loss: false
|
| 1121 |
+
tie_encoder_decoder: false
|
| 1122 |
+
tie_word_embeddings: true
|
| 1123 |
+
tokenizer_class: null
|
| 1124 |
+
top_k: 50
|
| 1125 |
+
top_p: 1
|
| 1126 |
+
torchscript: false
|
| 1127 |
+
typical_p: 1
|
| 1128 |
+
use_bfloat16: false
|
| 1129 |
+
user_token_id: 872
|
| 1130 |
+
tie_encoder_decoder:
|
| 1131 |
+
value: false
|
| 1132 |
+
tie_word_embeddings:
|
| 1133 |
+
value: true
|
| 1134 |
+
tokenizer_class:
|
| 1135 |
+
value: null
|
| 1136 |
+
top_entropy_quantile:
|
| 1137 |
+
value: 1
|
| 1138 |
+
top_k:
|
| 1139 |
+
value: 50
|
| 1140 |
+
top_p:
|
| 1141 |
+
value: 0.95
|
| 1142 |
+
torch_compile:
|
| 1143 |
+
value: false
|
| 1144 |
+
torch_compile_backend:
|
| 1145 |
+
value: null
|
| 1146 |
+
torch_compile_mode:
|
| 1147 |
+
value: null
|
| 1148 |
+
torch_empty_cache_steps:
|
| 1149 |
+
value: null
|
| 1150 |
+
torchdynamo:
|
| 1151 |
+
value: null
|
| 1152 |
+
torchscript:
|
| 1153 |
+
value: false
|
| 1154 |
+
tpu_metrics_debug:
|
| 1155 |
+
value: false
|
| 1156 |
+
tpu_num_cores:
|
| 1157 |
+
value: null
|
| 1158 |
+
trackio_space_id:
|
| 1159 |
+
value: trackio
|
| 1160 |
+
train_dataloader_shuffle:
|
| 1161 |
+
value: true
|
| 1162 |
+
transformers_version:
|
| 1163 |
+
value: 4.57.6
|
| 1164 |
+
tuner_backend:
|
| 1165 |
+
value: peft
|
| 1166 |
+
tuner_type:
|
| 1167 |
+
value: lora
|
| 1168 |
+
typical_p:
|
| 1169 |
+
value: 1
|
| 1170 |
+
use_bfloat16:
|
| 1171 |
+
value: false
|
| 1172 |
+
use_bias_correction_kl:
|
| 1173 |
+
value: false
|
| 1174 |
+
use_cpu:
|
| 1175 |
+
value: false
|
| 1176 |
+
use_flash_ckpt:
|
| 1177 |
+
value: false
|
| 1178 |
+
use_galore:
|
| 1179 |
+
value: false
|
| 1180 |
+
use_legacy_prediction_loop:
|
| 1181 |
+
value: false
|
| 1182 |
+
use_liger_kernel:
|
| 1183 |
+
value: false
|
| 1184 |
+
use_logits_to_keep:
|
| 1185 |
+
value: null
|
| 1186 |
+
use_mps_device:
|
| 1187 |
+
value: false
|
| 1188 |
+
use_transformers_paged:
|
| 1189 |
+
value: false
|
| 1190 |
+
use_vllm:
|
| 1191 |
+
value: false
|
| 1192 |
+
vit_gradient_checkpointing:
|
| 1193 |
+
value: true
|
| 1194 |
+
vit_lr:
|
| 1195 |
+
value: null
|
| 1196 |
+
vllm_data_parallel_size:
|
| 1197 |
+
value: 1
|
| 1198 |
+
vllm_disable_cascade_attn:
|
| 1199 |
+
value: false
|
| 1200 |
+
vllm_disable_custom_all_reduce:
|
| 1201 |
+
value: true
|
| 1202 |
+
vllm_enable_expert_parallel:
|
| 1203 |
+
value: false
|
| 1204 |
+
vllm_enable_lora:
|
| 1205 |
+
value: false
|
| 1206 |
+
vllm_enable_prefix_caching:
|
| 1207 |
+
value: true
|
| 1208 |
+
vllm_enable_sleep_mode:
|
| 1209 |
+
value: false
|
| 1210 |
+
vllm_enforce_eager:
|
| 1211 |
+
value: false
|
| 1212 |
+
vllm_gpu_memory_utilization:
|
| 1213 |
+
value: 0.9
|
| 1214 |
+
vllm_group_port:
|
| 1215 |
+
value: 51216
|
| 1216 |
+
vllm_importance_sampling_cap:
|
| 1217 |
+
value: 3
|
| 1218 |
+
vllm_importance_sampling_correction:
|
| 1219 |
+
value: true
|
| 1220 |
+
vllm_importance_sampling_mode:
|
| 1221 |
+
value: sequence_mask
|
| 1222 |
+
vllm_limit_mm_per_prompt:
|
| 1223 |
+
value: null
|
| 1224 |
+
vllm_max_lora_rank:
|
| 1225 |
+
value: 16
|
| 1226 |
+
vllm_max_model_len:
|
| 1227 |
+
value: null
|
| 1228 |
+
vllm_max_model_length:
|
| 1229 |
+
value: null
|
| 1230 |
+
vllm_max_num_seqs:
|
| 1231 |
+
value: null
|
| 1232 |
+
vllm_mm_processor_cache_gb:
|
| 1233 |
+
value: null
|
| 1234 |
+
vllm_mode:
|
| 1235 |
+
value: null
|
| 1236 |
+
vllm_model_impl:
|
| 1237 |
+
value: vllm
|
| 1238 |
+
vllm_pipeline_parallel_size:
|
| 1239 |
+
value: 1
|
| 1240 |
+
vllm_quantization:
|
| 1241 |
+
value: null
|
| 1242 |
+
vllm_reasoning_parser:
|
| 1243 |
+
value: null
|
| 1244 |
+
vllm_server_base_url:
|
| 1245 |
+
value: null
|
| 1246 |
+
vllm_server_group_port:
|
| 1247 |
+
value: null
|
| 1248 |
+
vllm_server_host:
|
| 1249 |
+
value: null
|
| 1250 |
+
vllm_server_pass_dataset:
|
| 1251 |
+
value: false
|
| 1252 |
+
vllm_server_port:
|
| 1253 |
+
value:
|
| 1254 |
+
- 8000
|
| 1255 |
+
vllm_server_timeout:
|
| 1256 |
+
value: 240
|
| 1257 |
+
vllm_speculative_config:
|
| 1258 |
+
value: null
|
| 1259 |
+
vllm_structured_outputs_regex:
|
| 1260 |
+
value: null
|
| 1261 |
+
vllm_tensor_parallel_size:
|
| 1262 |
+
value: 1
|
| 1263 |
+
vllm_use_async_engine:
|
| 1264 |
+
value: null
|
| 1265 |
+
wandb_log_unique_prompts:
|
| 1266 |
+
value: null
|
| 1267 |
+
warmup_ratio:
|
| 1268 |
+
value: 0.03
|
| 1269 |
+
warmup_steps:
|
| 1270 |
+
value: 0
|
| 1271 |
+
weight_decay:
|
| 1272 |
+
value: 0.1
|
wandb/run-20260417_123237-3h84yfea/files/media/table/completions_1_e5129c1db5b8522d8aa7.table.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"columns": ["step", "prompt", "completion", "ASRWerSubLenCmpHalluDirtyV56", "advantages", "solution"], "data": [["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The reverend recteur passed his hand wearily over his brow, a hill with a faint memory of running upstairs so quickly. We never touched the beastly box. The doctor then your competitor did said missus nelly no no said the curate hastily.<|im_end|>", -0.1968451738357544, -0.8322931528091431, "The reverend septimus passed his hand wearily over his brow. I feel a little faint, he said, running upstairs so quickly, we never touched the beastly box, said robert. Then your confederates did said miss selina. No, no, said the curate hastily."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The reverend rectory passed his hand wearily over his brow a hill and a faint misty morning upstairs, he said we never touched the beastly box then your competitor did said missus nixon no no said the curate hastily.<|im_end|>", -0.37275323271751404, -2.000243663787842, "The reverend septimus passed his hand wearily over his brow. I feel a little faint, he said, running upstairs so quickly, we never touched the beastly box, said robert. Then your confederates did said miss selina. No, no, said the curate hastily."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The reverend recteur passed his hand wearily over his brow a hill wind of faintness has been running upstairs so lately, we never touched the beastly box said the vicar then your competitor did said missus neil no no said the curate hastily.<|im_end|>", -0.174954354763031, -0.6869479417800903, "The reverend septimus passed his hand wearily over his brow. 
I feel a little faint, he said, running upstairs so quickly, we never touched the beastly box, said robert. Then your confederates did said miss selina. No, no, said the curate hastily."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The reverend recteur passed his hand wearily over his brow, a hillwood of faintness and running upstairs so quickly we never touched the beastly box said the vicar then your competitor's did said missus nelly no no said the curate hastily.<|im_end|>", -0.06302247941493988, 0.056229472160339355, "The reverend septimus passed his hand wearily over his brow. I feel a little faint, he said, running upstairs so quickly, we never touched the beastly box, said robert. Then your confederates did said miss selina. No, no, said the curate hastily."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The reverend rectors passed his hand wearily over his brow, I feel a little faint now for running upstairs so quickly. We never touched the beastly box said morris then your competitor did said missus merrithew no, no said the curate hastily.<|im_end|>", 0.24413266777992249, 2.0956015586853027, "The reverend septimus passed his hand wearily over his brow. I feel a little faint, he said, running upstairs so quickly, we never touched the beastly box, said robert. Then your confederates did said miss selina. 
No, no, said the curate hastily."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The reverend recteur passed his hand wearily over his brow a hill with a fainting man running upstairs so quickly, we never touched the beastly box said Robert and your competitor did said missus minton no no said the curate hastily.<|im_end|>", -0.09589200466871262, -0.16200941801071167, "The reverend septimus passed his hand wearily over his brow. I feel a little faint, he said, running upstairs so quickly, we never touched the beastly box, said robert. Then your confederates did said miss selina. No, no, said the curate hastily."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The reverend recteur passed his hand wearily over his brow a hill with a faint memory of running upstairs so quickly, we never touched the beastly box said the curate and your confederates did said missus mallet no no said the curate hastily.<|im_end|>", -0.09384658932685852, -0.1484287828207016, "The reverend septimus passed his hand wearily over his brow. I feel a little faint, he said, running upstairs so quickly, we never touched the beastly box, said robert. Then your confederates did said miss selina. No, no, said the curate hastily."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The reverend rectors passed his hand wearily over his brow a hill of saint nicholas went upstairs so quickly, we never touched the beastly box said robert then your competitor did said missus mink no no said the curate hastily.<|im_end|>", -0.005024942569434643, 0.44130709767341614, "The reverend septimus passed his hand wearily over his brow. I feel a little faint, he said, running upstairs so quickly, we never touched the beastly box, said robert. Then your confederates did said miss selina. 
No, no, said the curate hastily."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The reverend rectory passed his hand wearily over his brow a hillwood saint may be running upstairs so briskly, we never touched the beastly box said the curate and your competitor did said missus nelly no no said the curate hastily.<|im_end|>", -0.13762426376342773, -0.43909287452697754, "The reverend septimus passed his hand wearily over his brow. I feel a little faint, he said, running upstairs so quickly, we never touched the beastly box, said robert. Then your confederates did said miss selina. No, no, said the curate hastily."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The reverend recteur passed his hand wearily over his brow, I feel a little faint now that I am upstairs so quickly. We never touched the beastly box either than your competitor did said missus nelly no, no said the curate hastily.<|im_end|>", -0.004176640883088112, 0.4469394385814667, "The reverend septimus passed his hand wearily over his brow. I feel a little faint, he said, running upstairs so quickly, we never touched the beastly box, said robert. Then your confederates did said miss selina. No, no, said the curate hastily."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The reverend recteur passed his hand wearily over his brow a hill with a faint memory of running upstairs so quickly we never touched the beastly box said robert then your competitor did said missus nunn no, no, said the curate hastily.<|im_end|>", 0.04079977795481682, 0.7455626726150513, "The reverend septimus passed his hand wearily over his brow. I feel a little faint, he said, running upstairs so quickly, we never touched the beastly box, said robert. Then your confederates did said miss selina. 
No, no, said the curate hastily."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The reverend recteur passed his hand wearily over his brow a hill of faintness and running upstairs so quickly, we never touched the beastly box said robert then your competitor did said missus innes no no said the curate hastily<|im_end|>", 0.001311193685978651, 0.483376145362854, "The reverend septimus passed his hand wearily over his brow. I feel a little faint, he said, running upstairs so quickly, we never touched the beastly box, said robert. Then your confederates did said miss selina. No, no, said the curate hastily."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>There was much amazement spread among her sister, that political aspects of the revolution in france changed almost every day she might not understand how his own views and sympathies might often modify them.<|im_end|>", -0.10891497135162354, -2.1773321628570557, "There was much armand saint just could not tell his sister the political aspect of the revolution in france was changing almost every day. She might not understand how his own views and sympathies might become modified."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>There was much armagogy for my cousin's sister, the political aspect of the revolution in france changing almost every day. She might not understand how his own views and sympathies might be modified.<|im_end|>", 0.3462296724319458, 1.5272533893585205, "There was much armand saint just could not tell his sister the political aspect of the revolution in france was changing almost every day. 
She might not understand how his own views and sympathies might become modified."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>There was much armagnac jokes with my cousin sister, the political aspect of the revolution in france changing almost every day she might not understand how his own views and sympathies might differ from mine.<|im_end|>", 0.11626709252595901, -0.34449443221092224, "There was much armand saint just could not tell his sister the political aspect of the revolution in france was changing almost every day. She might not understand how his own views and sympathies might become modified."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>There was much armagnac jokes with my cousin sister, the political aspect of the revolution in france changing almost every day. She might not understand how his own views and sympathies might often modify.<|im_end|>", 0.257978618144989, 0.808946430683136, "There was much armand saint just could not tell his sister the political aspect of the revolution in france was changing almost every day. She might not understand how his own views and sympathies might become modified."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>There was much amaranteuse about Parisian society, the political aspect of the revolution in France changing almost every day. She might not understand how his own views and sympathies might often modify her.<|im_end|>", 0.21243521571159363, 0.43825238943099976, "There was much armand saint just could not tell his sister the political aspect of the revolution in france was changing almost every day. 
She might not understand how his own views and sympathies might become modified."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>There was much armagnac, jute and martell in his drink. The political aspect of the revolution is hence changing almost every day. She might not understand how his own views and sympathies might often modify it.<|im_end|>", 0.10369522124528885, -0.4468214213848114, "There was much armand saint just could not tell his sister the political aspect of the revolution in france was changing almost every day. She might not understand how his own views and sympathies might become modified."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>There was much armaghajet for my cousin sister, the political aspect of the revolution in france changing almost every day she might not understand how his own views and sympathies might often modify them.<|im_end|>", 0.13262253999710083, -0.21137160062789917, "There was much armand saint just could not tell his sister the political aspect of the revolution in france was changing almost every day. She might not understand how his own views and sympathies might become modified."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>There was much amarante jute for my traveling sister, the political aspect of the revolution in france changing almost every day she might not understand how his own views and sympathies might be modified.<|im_end|>", 0.26360028982162476, 0.8547032475471497, "There was much armand saint just could not tell his sister the political aspect of the revolution in france was changing almost every day. 
She might not understand how his own views and sympathies might become modified."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>There was much armagnac yoked to my parent's estate, the political aspect of the revolution of france changing almost every day she might not understand how his own views and sympathies might be modified.<|im_end|>", 0.18032926321029663, 0.1769305318593979, "There was much armand saint just could not tell his sister the political aspect of the revolution in france was changing almost every day. She might not understand how his own views and sympathies might become modified."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>There was much armance and jocund merrymaking there, but the political aspect of the revolution is hence changing almost every day. She might not understand how his own views and sympathies might often modify hers.<|im_end|>", 0.033820733428001404, -1.0155549049377441, "There was much armand saint just could not tell his sister the political aspect of the revolution in france was changing almost every day. She might not understand how his own views and sympathies might become modified."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>There was much arme hautes in my town, sister. The political aspect of the revolution is hence changing almost every day. She might not understand how his own views and sympathies might often modify.<|im_end|>", 0.10335493087768555, -0.44959115982055664, "There was much armand saint just could not tell his sister the political aspect of the revolution in france was changing almost every day. 
She might not understand how his own views and sympathies might become modified."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>There was much amazement spread among her sister, the political aspect of the revolution in france changing almost every day. She might not understand how his own views and sympathies might often modify.<|im_end|>", 0.26168063282966614, 0.8390784859657288, "There was much armand saint just could not tell his sister the political aspect of the revolution in france was changing almost every day. She might not understand how his own views and sympathies might become modified."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Never prior to a public meeting that the order should be payable in any year and do bear interest of five per cent if these orders were disposed of provisionally at least would be purchased he seconded with very little hesitation adopted both orders were immediately printed<|im_end|>", -0.32611703872680664, -0.7204017639160156, "and therefore i propos'd that the orders should be payable in a year and to bear an interest of five per cent with these orders i suppos'd the provisions might easily be purchas'd the assembly with very little hesitation adopted the proposal the orders were immediately printed"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Never provided for both that the order should be payable in any and do bearing interest of five per cent if these orders were to suppose provisions might easily be purchased is now with very little hesitation adopted both orders were immediately printed.<|im_end|>", -0.15472601354122162, 0.3779638409614563, "and therefore i propos'd that the orders should be payable in a year and to bear an interest of five per cent with these orders i suppos'd the 
provisions might easily be purchas'd the assembly with very little hesitation adopted the proposal the orders were immediately printed"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Never prior to public opinion that the order should be payable in a year and do bear an interest of five per cent if these orders were disposed of provisionally at least would be purchased he said with very little hesitation adopting both orders were immediately printed.<|im_end|>", -0.28605878353118896, -0.4636869728565216, "and therefore i propos'd that the orders should be payable in a year and to bear an interest of five per cent with these orders i suppos'd the provisions might easily be purchas'd the assembly with very little hesitation adopted the proposal the orders were immediately printed"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Never prior, but once that they ordered it should be payable in England and do bear an interest of five per cent if these orders were disposed of provisionally at least would be purchased he said with very little hesitation adopted both orders were immediately printed.<|im_end|>", -0.4090765416622162, -1.252050757408142, "and therefore i propos'd that the orders should be payable in a year and to bear an interest of five per cent with these orders i suppos'd the provisions might easily be purchas'd the assembly with very little hesitation adopted the proposal the orders were immediately printed"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Never cried out boldly that the order should be payable in England and do bearing interest five per cent, if these orders were disposed of provisionally at least would be purchased. 
His nephew with very little hesitation adopted both orders were immediately printed.<|im_end|>", -0.5401909947395325, -2.0923023223876953, "and therefore i propos'd that the orders should be payable in a year and to bear an interest of five per cent with these orders i suppos'd the provisions might easily be purchas'd the assembly with very little hesitation adopted the proposal the orders were immediately printed"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Never, prior to published that they ordered it should be payable in a year and do bear an interest of five per cent if these orders were disposed of provisions might easily be purchased he snapped with very little hesitation adopted both orders were immediately printed.<|im_end|>", -0.031015297397971153, 1.1707684993743896, "and therefore i propos'd that the orders should be payable in a year and to bear an interest of five per cent with these orders i suppos'd the provisions might easily be purchas'd the assembly with very little hesitation adopted the proposal the orders were immediately printed"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Never prior to public debate that the order should be payable in any year and to bear an interest of five per cent, if these orders were supposed provisionists might easily be purchased. 
His cabinet with very little hesitation adopted both orders were immediately granted.<|im_end|>", -0.08785741031169891, 0.8064936995506287, "and therefore i propos'd that the orders should be payable in a year and to bear an interest of five per cent with these orders i suppos'd the provisions might easily be purchas'd the assembly with very little hesitation adopted the proposal the orders were immediately printed"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Never prior to public opinion that the order should be payable in England and do bear an interest of five per cent if these orders were supposed provisionally easy to be purchased, this act with very little hesitation adopted them both orders were immediately printed.<|im_end|>", -0.2863375246524811, -0.4654732942581177, "and therefore i propos'd that the orders should be payable in a year and to bear an interest of five per cent with these orders i suppos'd the provisions might easily be purchas'd the assembly with very little hesitation adopted the proposal the orders were immediately printed"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Never, privateer boat. 
That they ordered should be payable in England and do bear interest of five per cent that these orders might suppose the provisions might easily be purchased he seconded with very little hesitation adopted both orders were immediately printed.<|im_end|>", -0.09660232812166214, 0.7504515647888184, "and therefore i propos'd that the orders should be payable in a year and to bear an interest of five per cent with these orders i suppos'd the provisions might easily be purchas'd the assembly with very little hesitation adopted the proposal the orders were immediately printed"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Never, prior or above that they ordered should be payable in a year and to bear an interest of five per cent if these orders were disposed of provisionally at least would be purchased his nephew with very little hesitation adopted both orders were immediately granted<|im_end|>", -0.16866184771060944, 0.28865551948547363, "and therefore i propos'd that the orders should be payable in a year and to bear an interest of five per cent with these orders i suppos'd the provisions might easily be purchas'd the assembly with very little hesitation adopted the proposal the orders were immediately printed"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Never prior to published that the order should be payable in any and do bear an interest of five per cent, if these orders were supposed provisions might easily be purchased he seconded with very little hesitation adopted both orders were immediately printed.<|im_end|>", -0.08984959125518799, 0.7937267422676086, "and therefore i propos'd that the orders should be payable in a year and to bear an interest of five per cent with these orders i suppos'd the provisions might easily be purchas'd the assembly with very little hesitation adopted the proposal the orders 
were immediately printed"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Never, prior to public debate that the order should be payable in England and do bear an interest of five per cent. That these orders would suppose the provisions might easily be purchased. His cabinet with very little hesitation adopted both orders were immediately printed.<|im_end|>", -0.08795680850744247, 0.8058566451072693, "and therefore i propos'd that the orders should be payable in a year and to bear an interest of five per cent with these orders i suppos'd the provisions might easily be purchas'd the assembly with very little hesitation adopted the proposal the orders were immediately printed"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>As his trumpet blast sounded forth, he said, the free folk of all that hill give a cheap word and warning that they will fight against you when you come. To her own side came back this ringing reply as the knight rode up with many and fierce assailants.<|im_end|>", -0.7235177755355835, -0.37753382325172424, "Herald of arkell. As his trumpet blast sounded before the gate of the citadel, the free lord of arkell here giveth you word and warning that he will fight against you on the morrow. And from the citadel came back this ringing reply, as the knight of leyenburg made answer for his sovereign lady."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>As his trumpet blast sounded over the hill, the three lords of alba heard it and warned and warning at him to fight against you on your mountain. From whence he came back this ringing reply as a knightly lord might answer in such a manner.<|im_end|>", -0.7205132842063904, -0.3610304296016693, "Herald of arkell. 
As his trumpet blast sounded before the gate of the citadel, the free lord of arkell here giveth you word and warning that he will fight against you on the morrow. And from the citadel came back this ringing reply, as the knight of leyenburg made answer for his sovereign lady."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>As his trumpet blast sounded over the open field, the three lord larker here give it you word and warning that he will fight against you on your mountain from whence now came back this ringing reply of the knight in yellow with mallet and scimitar in hand.<|im_end|>", -0.4105190336704254, 1.3417396545410156, "Herald of arkell. As his trumpet blast sounded before the gate of the citadel, the free lord of arkell here giveth you word and warning that he will fight against you on the morrow. And from the citadel came back this ringing reply, as the knight of leyenburg made answer for his sovereign lady."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>As his trumpet blast sounded in the open air, the three four walked out and he gave a deep wordy warning that he would fight against you when you met him. And from the hill came back this ringing reply as the knight who had but lately entered the city wall.<|im_end|>", -0.6633491516113281, -0.04703306034207344, "Herald of arkell. As his trumpet blast sounded before the gate of the citadel, the free lord of arkell here giveth you word and warning that he will fight against you on the morrow. 
And from the citadel came back this ringing reply, as the knight of leyenburg made answer for his sovereign lady."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>As his trumpet blast sounded over the hills, the three lords of Argor hear give a deep word and warning that they will fight against you when you come. And from these lips came back this ringing reply as the knight who had brought my answer disappeared again.<|im_end|>", -0.533552348613739, 0.6659289002418518, "Herald of arkell. As his trumpet blast sounded before the gate of the citadel, the free lord of arkell here giveth you word and warning that he will fight against you on the morrow. And from the citadel came back this ringing reply, as the knight of leyenburg made answer for his sovereign lady."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>As his trumpet blast sounded forth, he said, the three lords of algalhia give a few word and warning that they will fight against you on your mountain when the messenger came back with screaming reply that the knight had been overtaken by the sons of the sea.<|im_end|>", -0.7495418190956116, -0.520481526851654, "Herald of arkell. As his trumpet blast sounded before the gate of the citadel, the free lord of arkell here giveth you word and warning that he will fight against you on the morrow. 
And from the citadel came back this ringing reply, as the knight of leyenburg made answer for his sovereign lady."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>As his trumpet blast sounded forth, he cried, the free folk of all great hill give us your word and warning that you will fight against you no more from whose lips came back this ringing reply as the knight who had brought my answer was singing aloud.<|im_end|>", -0.6600818634033203, -0.029086142778396606, "Herald of arkell. As his trumpet blast sounded before the gate of the citadel, the free lord of arkell here giveth you word and warning that he will fight against you on the morrow. And from the citadel came back this ringing reply, as the knight of leyenburg made answer for his sovereign lady."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>As his trumpet blast sounded through the air, he said, the three lords of all that hill give a chief warning warning that he will fight against you when the night is done with my engines and the sun goes down.<|im_end|>", -0.9883988499641418, -1.8325012922286987, "Herald of arkell. As his trumpet blast sounded before the gate of the citadel, the free lord of arkell here giveth you word and warning that he will fight against you on the morrow. And from the citadel came back this ringing reply, as the knight of leyenburg made answer for his sovereign lady."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>As his trumpet blast sounded over, he cried, the free born far from here give a cheap word and warning that he will fight against you when you know it, but from the hills came back this ringing reply of the knight who had heard my legend and was singing along.<|im_end|>", -0.6016453504562378, 0.29190027713775635, "Herald of arkell. 
As his trumpet blast sounded before the gate of the citadel, the free lord of arkell here giveth you word and warning that he will fight against you on the morrow. And from the citadel came back this ringing reply, as the knight of leyenburg made answer for his sovereign lady."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>As his trumpet blast sounded forth, he said the three lords of Argyle give a cheap word and warning that they will fight against you on the morrow. From his lips came back this ringing reply as the knight rode up with my lady and her sister in their arms.<|im_end|>", -0.5207002758979797, 0.7365241646766663, "Herald of arkell. As his trumpet blast sounded before the gate of the citadel, the free lord of arkell here giveth you word and warning that he will fight against you on the morrow. And from the citadel came back this ringing reply, as the knight of leyenburg made answer for his sovereign lady."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>As his trumpet blast sounded out, he exclaimed, the freeborn flock will hear gibbetty's warning and warn him of a fight against you on the morrow. The horned giant came back with a ringing reply as the knight rode up at my aunt's house in the evening.<|im_end|>", -0.906722903251648, -1.383862853050232, "Herald of arkell. As his trumpet blast sounded before the gate of the citadel, the free lord of arkell here giveth you word and warning that he will fight against you on the morrow. 
And from the citadel came back this ringing reply, as the knight of leyenburg made answer for his sovereign lady."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>As his trumpet blast sounded forth, he said, the free born robber here give a cheap word and warning that he will fight against you on the morrow. From the hill came back this ringing reply of the knight who had but lately entered into the city again.<|im_end|>", -0.3788970112800598, 1.5154365301132202, "Herald of arkell. As his trumpet blast sounded before the gate of the citadel, the free lord of arkell here giveth you word and warning that he will fight against you on the morrow. And from the citadel came back this ringing reply, as the knight of leyenburg made answer for his sovereign lady."]]}
|
wandb/run-20260417_123237-3h84yfea/files/media/table/completions_3_0656117578a4523e0161.table.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"columns": ["step", "prompt", "completion", "ASRWerSubLenCmpHalluDirtyV56", "advantages", "solution"], "data": [["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Coordinating and shifting, collectively said she who divided with each other in forming new combinations we must remember however that the flower worship of the teegos performed only a part of their ascetic ritual and it was not a distinct religion by itself.<|im_end|>", 0.14862142503261566, 0.6244527101516724, "kobori enshiu katagiri sekishiu vied with each other in forming new combinations we must remember however that the flower worship of the tea masters formed only a part of their aesthetic ritual and was not a distinct religion by itself"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Kohori and shi no kafu ni sei shi no vie with each other in forming new combinations. We must remember, however, that the flower worship of the te deus was formed from only a part of their respective ritual, and it was not a distinct religion by itself.<|im_end|>", -0.41201284527778625, -2.48225474357605, "kobori enshiu katagiri sekishiu vied with each other in forming new combinations we must remember however that the flower worship of the tea masters formed only a part of their aesthetic ritual and was not a distinct religion by itself"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Coordinating and shifting, coupling these symphysies, fighting with each other in forming new combinations. 
We must remember, however, that the flower worship of the timbuctoes formed only a part of their ascetic ritual, and was not a distinct religion by itself.<|im_end|>", 0.05453629419207573, 0.1030879095196724, "kobori enshiu katagiri sekishiu vied with each other in forming new combinations we must remember however that the flower worship of the tea masters formed only a part of their aesthetic ritual and was not a distinct religion by itself"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Kohori and mushi, kafanguri and seshishi, fight with each other in forming new combinations. We must remember however that the flower worship of the teengus was formed from only a part of their respective ritual and it was not a distinct religion by itself.<|im_end|>", 0.14244088530540466, 0.5902037620544434, "kobori enshiu katagiri sekishiu vied with each other in forming new combinations we must remember however that the flower worship of the tea masters formed only a part of their aesthetic ritual and was not a distinct religion by itself"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Coordinating and shifting, coupling these sub species by way with each other in forming new combinations. 
We must remember however that the flower worship of the tibetans was formed from only a part of their ascetic ritual, and it was not a distinct religion by itself.<|im_end|>", -0.07631387561559677, -0.6220072507858276, "kobori enshiu katagiri sekishiu vied with each other in forming new combinations we must remember however that the flower worship of the tea masters formed only a part of their aesthetic ritual and was not a distinct religion by itself"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Co-ordinating shi'lu, collectively said yishu, vied with each other in forming new combinations. We must remember, however, that the flower worship of the tin gods was but only a part of their respective ritual and it was not a distinct religion by itself.<|im_end|>", 0.05551755055785179, 0.10852545499801636, "kobori enshiu katagiri sekishiu vied with each other in forming new combinations we must remember however that the flower worship of the tea masters formed only a part of their aesthetic ritual and was not a distinct religion by itself"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Co-ordinating and shifting, collectively said she, fighting with each other in forming new combinations. 
We must remember, however, that the flower worship of the teentas was but only a part of their ascetic ritual, and it was not a distinct religion by itself.<|im_end|>", -0.08575789630413055, -0.6743404865264893, "kobori enshiu katagiri sekishiu vied with each other in forming new combinations we must remember however that the flower worship of the tea masters formed only a part of their aesthetic ritual and was not a distinct religion by itself"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Cobordia and shibu, kathagunis and yishu divided with each other in forming new combinations. We must remember however that the flower worship of the teengus was formed from only a part of their accepted ritual, and it was not a distinct religion by itself.<|im_end|>", 0.07381142675876617, 0.2098994255065918, "kobori enshiu katagiri sekishiu vied with each other in forming new combinations we must remember however that the flower worship of the tea masters formed only a part of their aesthetic ritual and was not a distinct religion by itself"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Coordinating and shifting, catalyzing and dissolving, vying with each other in forming new combinations. 
We must remember, however, that the flower worship of the tibetans was formed from only a part of their ascetic ritual, and it was not a distinct religion by itself.<|im_end|>", -0.07421640306711197, -0.6103842854499817, "kobori enshiu katagiri sekishiu vied with each other in forming new combinations we must remember however that the flower worship of the tea masters formed only a part of their aesthetic ritual and was not a distinct religion by itself"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Kohori and mushi, kafanuise and yishi combined with each other in forming new combinations. We must remember however that the flower worship of the teungus was formed from only a part of their respective ritual and it was not a distinct religion by itself.<|im_end|>", 0.14416144788265228, 0.5997381210327148, "kobori enshiu katagiri sekishiu vied with each other in forming new combinations we must remember however that the flower worship of the tea masters formed only a part of their aesthetic ritual and was not a distinct religion by itself"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Coordinating shiuk, collectively said, yishuk, fight with each other in forming new combinations. 
We must remember however that the flower worship of the tin gods was only a part of their accepted ritual and it was not a distinct religion by itself.<|im_end|>", 0.1842457801103592, 0.8218620419502258, "kobori enshiu katagiri sekishiu vied with each other in forming new combinations we must remember however that the flower worship of the tea masters formed only a part of their aesthetic ritual and was not a distinct religion by itself"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Kohori and mushi, katakuri and saki shu, fight with each other in forming new combinations. We must remember however that the flower worship of the tea masters formed only a part of their ascetic ritual, and was not a distinct religion by itself.<|im_end|>", 0.27616366744041443, 1.3312172889709473, "kobori enshiu katagiri sekishiu vied with each other in forming new combinations we must remember however that the flower worship of the tea masters formed only a part of their aesthetic ritual and was not a distinct religion by itself"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>With red hot boulders lying about everywhere, do you think it went off well? Creedle he asked, the victuals did that I know, and the drink did that I set fast to believe upon a sound of barrels good honest drink.<|im_end|>", 0.21575099229812622, 0.835888683795929, "with red hot bowlders lying about everywhere do you think it went off well creedle he asked the victuals did that i know and the drink did that i steadfastly believe from the holler sound of the barrels good honest drink"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>With red hot bolters flying about everywhere, d'you think it went off well? Creedle he asked her. 
The bittles did that I know and the drink did that I said passed in belief up on the chaffin barrels good honest strength.<|im_end|>", -0.07250922918319702, -1.3199952840805054, "with red hot bowlders lying about everywhere do you think it went off well creedle he asked the victuals did that i know and the drink did that i steadfastly believe from the holler sound of the barrels good honest drink"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>With red hot boulders flying about everywhere, d'you think it went off well at the cradle? He asked her the victuals did that I know and the drink did that I said passed me believe upon a sound of barrels good honest strength.<|im_end|>", -0.02524890936911106, -0.9665377140045166, "with red hot bowlders lying about everywhere do you think it went off well creedle he asked the victuals did that i know and the drink did that i steadfastly believe from the holler sound of the barrels good honest drink"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>With red hot boulders lying about everywhere, do you think it went off well? Creedle he asked the victors did that I know and the drink did that I set fast to believe upon a sound of barrels good honest strength.<|im_end|>", 0.2779328227043152, 1.3009434938430786, "with red hot bowlders lying about everywhere do you think it went off well creedle he asked the victuals did that i know and the drink did that i steadfastly believe from the holler sound of the barrels good honest drink"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>With red hot boulders lying about everywhere. D'you think it went off while a cradle? 
He asked her, the victuals did that I know and the drink did that I steadfastly believe upon a sound of barrels good honest drink.<|im_end|>", 0.23886768519878387, 1.0087772607803345, "with red hot bowlders lying about everywhere do you think it went off well creedle he asked the victuals did that i know and the drink did that i steadfastly believe from the holler sound of the barrels good honest drink"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>With red hot boulders lying about everywhere, d'you think it went off while cradle? He asked her, the victuals did that I know and the drink did, that I said fastly believe upon a chance of barrels good honest drink.<|im_end|>", 0.015103586949408054, -0.6647433638572693, "with red hot bowlders lying about everywhere do you think it went off well creedle he asked the victuals did that i know and the drink did that i steadfastly believe from the holler sound of the barrels good honest drink"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>With red hot boulders lying about everywhere, d'you think it went off well? Creel he asked her the victuals did that I know and the drink did that I said passed me believe up on a chaff in barrels good honest strength.<|im_end|>", -0.05440647527575493, -1.1846057176589966, "with red hot bowlders lying about everywhere do you think it went off well creedle he asked the victuals did that i know and the drink did that i steadfastly believe from the holler sound of the barrels good honest drink"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>With red hot boulders lying about everywhere. Did you think it went off well, creedle? He asked me. 
The victuals did that I know and the drink did, that I said, must be believe upon a sound of barrels good honest strength.<|im_end|>", 0.08476551622152328, -0.14374522864818573, "with red hot bowlders lying about everywhere do you think it went off well creedle he asked the victuals did that i know and the drink did that i steadfastly believe from the holler sound of the barrels good honest drink"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>With red hot boulders flying about everywhere. D'you think it went off well, creel? He asked her. The victuals did that I know and the drink did that I steadfastly believe upon a sound of barrels good honest strength.<|im_end|>", 0.2250947505235672, 0.9057701826095581, "with red hot bowlders lying about everywhere do you think it went off well creedle he asked the victuals did that i know and the drink did that i steadfastly believe from the holler sound of the barrels good honest drink"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>With red hot bolters flying about everywhere, do you think it went off well? Creel he asked. The biddles did that I know and the drink did that I steadfastly believe upon a sound of barrels good honest drink.<|im_end|>", 0.27579447627067566, 1.2849509716033936, "with red hot bowlders lying about everywhere do you think it went off well creedle he asked the victuals did that i know and the drink did that i steadfastly believe from the holler sound of the barrels good honest drink"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>With red hot boulders lying about everywhere, do you think it went off while in the cradle? He asked her. 
The victuals did that I know, and the drink did that I said passed me believe upon a sound of barrels good honest drink.<|im_end|>", 0.03807579353451729, -0.4929353892803192, "with red hot bowlders lying about everywhere do you think it went off well creedle he asked the victuals did that i know and the drink did that i steadfastly believe from the holler sound of the barrels good honest drink"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>With red hot boulders flying about everywhere. D'you think it went off well, creedle? He asked her. The victuals did that I know and the drink did that I set fast in believe upon a sound of barrels good honest drink.<|im_end|>", 0.028604861348867416, -0.5637679696083069, "with red hot bowlders lying about everywhere do you think it went off well creedle he asked the victuals did that i know and the drink did that i steadfastly believe from the holler sound of the barrels good honest drink"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For it is wonderful how names can be acquired by some means. The writer was once employed in teaching a course of lectures to his friends, and repeated very handsome gilding on the colonies of babies which seemed to answer just at once.<|im_end|>", -0.5981812477111816, -0.7124949097633362, "For it is wonderful how soon these are acquired by some horses. The writer was once employed to purchase a horse for a country friend. And he picked a very handsome gelding out of collins's stables, which seemed to answer to his friend's wants."], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For it is wonderful how many things may be acquired by some means. 
The writer was once employed in teaching a boy his arithmetic to French, and repeated very handsome gilding on the colonies of babies, which seems answer to the parents wants.<|im_end|>", -0.6030839681625366, -0.7439505457878113, "For it is wonderful how soon these are acquired by some horses. The writer was once employed to purchase a horse for a country friend. And he picked a very handsome gelding out of collins's stables, which seemed to answer to his friend's wants."], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For it is wonderful how a name can be acquired by some means. The writer was once employed in purchasing a horse for his brother's friend, and he picked up mary hansen gelding on the collins estate, which seems answer to his friend's wants.<|im_end|>", -0.16422338783740997, 2.071758270263672, "For it is wonderful how soon these are acquired by some horses. The writer was once employed to purchase a horse for a country friend. And he picked a very handsome gelding out of collins's stables, which seemed to answer to his friend's wants."], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For it is wonderful how many names have been supplied by some of us. The writer was once employed in teaching a course of lectures on French, and repeated Mary hansen gellin on the colonies of ladies, which seems answerable to his friend's wants.<|im_end|>", -0.6562139391899109, -1.0848299264907837, "For it is wonderful how soon these are acquired by some horses. The writer was once employed to purchase a horse for a country friend. 
And he picked a very handsome gelding out of collins's stables, which seemed to answer to his friend's wants."], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For it is wonderful how many things can be acquired by some means a writer was once employed in preaching authority from scripture to friends, and he picked up mary hansen gelding on the colony of cape town, which seems answer to his friend's wants.<|im_end|>", -0.48777177929878235, -0.00411293376237154, "For it is wonderful how soon these are acquired by some horses. The writer was once employed to purchase a horse for a country friend. And he picked a very handsome gelding out of collins's stables, which seemed to answer to his friend's wants."], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For it is wonderful how names may be acquired by some means a writer was once employed in purchase of horses from a friend and repeated mary hansen gilding on the colony of scotland which seems answer to his friend's want.<|im_end|>", -0.45017996430397034, 0.23707440495491028, "For it is wonderful how soon these are acquired by some horses. The writer was once employed to purchase a horse for a country friend. And he picked a very handsome gelding out of collins's stables, which seemed to answer to his friend's wants."], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For it is wonderful how men can be inspired by some of these things. The writer was once employed in purchase of horses from his friends, and they picked up very handsome geldings on the colonies of cape verd which seemed to answer just such wants.<|im_end|>", -0.5413256883621216, -0.34771230816841125, "For it is wonderful how soon these are acquired by some horses. 
The writer was once employed to purchase a horse for a country friend. And he picked a very handsome gelding out of collins's stables, which seemed to answer to his friend's wants."], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For it is wonderful how names may be acquired by some means a writer was once employed in purchase of one such book from his friend and repeated mary hansen gelling on the colonies of ceders which seems answer to his friend's wants.<|im_end|>", -0.5219820141792297, -0.2236042022705078, "For it is wonderful how soon these are acquired by some horses. The writer was once employed to purchase a horse for a country friend. And he picked a very handsome gelding out of collins's stables, which seemed to answer to his friend's wants."], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For it is wonderful how a name can be acquired by some means. The writer was once employed in teaching a course of lectures on French, and repeated Mary henson gilding on the colonies of Canada, which seems answer to his friend's wants.<|im_end|>", -0.4530133306980133, 0.21889565885066986, "For it is wonderful how soon these are acquired by some horses. The writer was once employed to purchase a horse for a country friend. And he picked a very handsome gelding out of collins's stables, which seemed to answer to his friend's wants."], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For it is wonderful how many things are required by some of us. The writer was once employed in preaching before a large company at friends, and repeated with very handsome gilding on the columns of statius which seems answer to his friend's wants.<|im_end|>", -0.5449039340019226, -0.3706701695919037, "For it is wonderful how soon these are acquired by some horses. 
The writer was once employed to purchase a horse for a country friend. And he picked a very handsome gelding out of collins's stables, which seemed to answer to his friend's wants."], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For it is wonderful how many things can be acquired by some means a writer was once employed in purchase of horses from his friends and he picked up very handsome geldings on the colonies of cape cruz which seemed to answer to his friend's wants.<|im_end|>", -0.20373354852199554, 1.8182631731033325, "For it is wonderful how soon these are acquired by some horses. The writer was once employed to purchase a horse for a country friend. And he picked a very handsome gelding out of collins's stables, which seemed to answer to his friend's wants."], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For it is wonderful how men may be inspired by some muse a writer was once employed in which office he got continual friends and made pictures very handsome gilding on the columns of statues which seems answer to his friend's wants.<|im_end|>", -0.6209558844566345, -0.8586159348487854, "For it is wonderful how soon these are acquired by some horses. The writer was once employed to purchase a horse for a country friend. And he picked a very handsome gelding out of collins's stables, which seemed to answer to his friend's wants."], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>A week after the battle, my brother replied there on a capital expedition to make a horrible discovery that involved eating up the bodies of our dead heroes. 
That too was worth it.<|im_end|>", 0.11993206292390823, 0.7482782602310181, "a week after the battle my brother rode by there on a cavalry expedition and made the horrible discovery that hogs were eating up the bodies of our dead heroes that too was war"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>A week after the battle, my brother was invited by a cavalry expedition to make a horrible supper at a hall in the eating of the bodies of our dead heroes. That too is over.<|im_end|>", -0.41032978892326355, -1.1197341680526733, "a week after the battle my brother rode by there on a cavalry expedition and made the horrible discovery that hogs were eating up the bodies of our dead heroes that too was war"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>A week after the battle, my brother took a lighter and captured my expedition to make the horrible discovery that all were eating up the bodies of our dead heroes. That too was worth it.<|im_end|>", 0.021145427599549294, 0.40027153491973877, "a week after the battle my brother rode by there on a cavalry expedition and made the horrible discovery that hogs were eating up the bodies of our dead heroes that too was war"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>A week after the battle, my brother stood by her on the scaffold in my position and made a horrible discovery that I had caught the beating of the pines of our dead heroes. 
That too was worth it.<|im_end|>", -0.47986671328544617, -1.3646996021270752, "a week after the battle my brother rode by there on a cavalry expedition and made the horrible discovery that hogs were eating up the bodies of our dead heroes that too was war"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>A week after the battle, my brother was invited by a capital man of business to make a horrible discovery at home, eating up the bodies of our dead heroes. That too was worth it.<|im_end|>", -0.32124173641204834, -0.8058937788009644, "a week after the battle my brother rode by there on a cavalry expedition and made the horrible discovery that hogs were eating up the bodies of our dead heroes that too was war"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>A week after the battle, my brother replied there in a cavalry expedition to make a horrible discovery at home of the bodies of our dead heroes. That too was worth it.<|im_end|>", -0.12081809341907501, -0.09983913600444794, "a week after the battle my brother rode by there on a cavalry expedition and made the horrible discovery that hogs were eating up the bodies of our dead heroes that too was war"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>A week after the battle, my brother replied there in a capital translation to me the horrible discovery that all were eating up the bodies of our dead heroes. 
That too was worth it.<|im_end|>", 0.1116841584444046, 0.7192224264144897, "a week after the battle my brother rode by there on a cavalry expedition and made the horrible discovery that hogs were eating up the bodies of our dead heroes that too was war"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>A week after the battle, my brother was invited by our cavalry expedition to make a horrible supper at a hall meeting of the bodies of our dead heroes. That too was ordered.<|im_end|>", -0.3647739291191101, -0.9592495560646057, "a week after the battle my brother rode by there on a cavalry expedition and made the horrible discovery that hogs were eating up the bodies of our dead heroes that too was war"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>A week after the battle, my brother replied there from the capital of my expedition, he made a horrible discovery that called for eating up the bodies of our dead heroes. That too was ordered.<|im_end|>", -0.16730603575706482, -0.263607382774353, "a week after the battle my brother rode by there on a cavalry expedition and made the horrible discovery that hogs were eating up the bodies of our dead heroes that too was war"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>A week after the battle, my brother replied there from a cavalry expedition and made a horrible discovery that called the eating of the bodies of our dead heroes. 
That too was war.<|im_end|>", 0.26659682393074036, 1.2649505138397217, "a week after the battle my brother rode by there on a cavalry expedition and made the horrible discovery that hogs were eating up the bodies of our dead heroes that too was war"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>A week after the battle, my brother replied there on a capital expedition to make the horrible discovery that he had fallen in the eating of the pies of our dead heroes. That too was a word.<|im_end|>", -0.18637478351593018, -0.3307829797267914, "a week after the battle my brother rode by there on a cavalry expedition and made the horrible discovery that hogs were eating up the bodies of our dead heroes that too was war"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>A week after the battle, my brother rode by there on a cavalry expedition to make the horrible discovery that Paul was eating up the bodies of our dead heroes. That too is worth.<|im_end|>", 0.4216246008872986, 1.8110840320587158, "a week after the battle my brother rode by there on a cavalry expedition and made the horrible discovery that hogs were eating up the bodies of our dead heroes that too was war"]]}
|
wandb/run-20260417_123237-3h84yfea/files/media/table/completions_5_f2bf6a8e887194296a09.table.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"columns": ["step", "prompt", "completion", "ASRWerSubLenCmpHalluDirtyV56", "advantages", "solution"], "data": [["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Instead of listening to you, I tell you that from this day forward, I will give that great man a pension of a thousand pieces of gold per month for his life. Nay, though I were to share with him all my riches and dominions.<|im_end|>", 0.7513310313224792, -0.40651965141296387, "instead of listening to you i tell you that from this day forward i will give that great man a pension of a thousand pieces of gold per month for his life nay though i were to share with him all my riches and dominions"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Instead of listening to you, I tell you that from this day forward, I will give that great man a pension of a thousand pieces of gold per month for his life. Nay, though I were to share with him all my riches and provisions.<|im_end|>", 0.7468931674957275, -0.49668067693710327, "instead of listening to you i tell you that from this day forward i will give that great man a pension of a thousand pieces of gold per month for his life nay though i were to share with him all my riches and dominions"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Instead of listening to you, I tell you that from this day forward, I will give that great man a pension of a thousand pieces of gold per month for his life. 
Nay, though I were to share with him all my riches and dominions.<|im_end|>", 0.7513310313224792, -0.40651965141296387, "instead of listening to you i tell you that from this day forward i will give that great man a pension of a thousand pieces of gold per month for his life nay though i were to share with him all my riches and dominions"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Instead of listening to you, I tell you that from this day forward, I will give that great man a pension of a thousand pieces of gold per month for his life. Nay, though I were to share with him all my riches and dominions.<|im_end|>", 0.7513310313224792, -0.40651965141296387, "instead of listening to you i tell you that from this day forward i will give that great man a pension of a thousand pieces of gold per month for his life nay though i were to share with him all my riches and dominions"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Instead of listening to you, I tell you that from this day forward, I will give that great man a pension of a thousand pieces of gold per month for his life. Nay, though I were to share with him all my riches and dominions.<|im_end|>", 0.7513310313224792, -0.40651965141296387, "instead of listening to you i tell you that from this day forward i will give that great man a pension of a thousand pieces of gold per month for his life nay though i were to share with him all my riches and dominions"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Instead of listening to you, I tell you that from this day forward, I will give that great man a pension of a thousand pieces of gold per month for his life. 
Nay, though I were to share with him all my riches and dominions.<|im_end|>", 0.7513310313224792, -0.40651965141296387, "instead of listening to you i tell you that from this day forward i will give that great man a pension of a thousand pieces of gold per month for his life nay though i were to share with him all my riches and dominions"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Instead of listening to you, I tell you that from this day forward, I will give that great man a pension of a thousand pieces of gold per month for his life. Nay, though I were to share with him all my riches and dominions.<|im_end|>", 0.7513310313224792, -0.40651965141296387, "instead of listening to you i tell you that from this day forward i will give that great man a pension of a thousand pieces of gold per month for his life nay though i were to share with him all my riches and dominions"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Instead of listening to you, I tell you that from this day forward, I will give that great man a pension of a thousand pieces of gold per month for his life. 
Nay, though I were to share with him all my riches and dominions.<|im_end|>", 0.7513310313224792, -0.40651965141296387, "instead of listening to you i tell you that from this day forward i will give that great man a pension of a thousand pieces of gold per month for his life nay though i were to share with him all my riches and dominions"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Instead of listening to you, I tell you that from this day forward I will give that great man a pension of a thousand pieces of gold per month for his life nay, though I were to share with him all my riches and provisions<|im_end|>", 0.8469211459159851, 1.5355191230773926, "instead of listening to you i tell you that from this day forward i will give that great man a pension of a thousand pieces of gold per month for his life nay though i were to share with him all my riches and dominions"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Instead of listening to you, I tell you that from this day forward, I will give that great man a pension of a thousand pieces of gold per month for his life nay though I were to share with him all my riches and dominions<|im_end|>", 0.9002925753593445, 2.6198298931121826, "instead of listening to you i tell you that from this day forward i will give that great man a pension of a thousand pieces of gold per month for his life nay though i were to share with him all my riches and dominions"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Instead of listening to you, I tell you that from this day forward, I will give that great man a pension of a thousand pieces of gold per month for his life. 
Nay, though I were to share with him all my riches and dominions.<|im_end|>", 0.7513310313224792, -0.40651965141296387, "instead of listening to you i tell you that from this day forward i will give that great man a pension of a thousand pieces of gold per month for his life nay though i were to share with him all my riches and dominions"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Instead of listening to you, I tell you that from this day forward, I will give that great man a pension of a thousand pieces of gold per month for his life. Nay, though I were to share with him all my riches and dominions.<|im_end|>", 0.7513310313224792, -0.40651965141296387, "instead of listening to you i tell you that from this day forward i will give that great man a pension of a thousand pieces of gold per month for his life nay though i were to share with him all my riches and dominions"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The baker shook his head, the crime which I have committed now or has no place among you in justice. And you can only deliver me from it by blessing me secretly as you have just done come, put hand before the persecutor.<|im_end|>", -0.023505905643105507, -0.4367395341396332, "The beggar shook his head. The crime which I have committed, my lord, has no call upon human justice. And you can only deliver me from it by blessing me frequently, as you have just done. Come be candid, said the coadjutor."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The baker shook his head, the crime which I have committed now will have no cause of human injustice. And you can only deliver me from it by blessing this wicked day as you have just done. 
Come, my candids said the presider.<|im_end|>", -0.021910538896918297, -0.4288407862186432, "The beggar shook his head. The crime which I have committed, my lord, has no call upon human justice. And you can only deliver me from it by blessing me frequently, as you have just done. Come be candid, said the coadjutor."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The baker shook his head, the crime which I have committed now will be called upon you in justice and you can only deliver me from it by blessing this sacred day as you have just done come let's end it said the presider.<|im_end|>", -0.23740261793136597, -1.495755672454834, "The beggar shook his head. The crime which I have committed, my lord, has no call upon human justice. And you can only deliver me from it by blessing me frequently, as you have just done. Come be candid, said the coadjutor."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The baker shook his head, but the crime which I have committed now is too large for any injustice and you can only deliver me from it by blessing me secretly as you have just done. Come up hand before the persecutor.<|im_end|>", -0.08132755011320114, -0.7230181097984314, "The beggar shook his head. The crime which I have committed, my lord, has no call upon human justice. And you can only deliver me from it by blessing me frequently, as you have just done. Come be candid, said the coadjutor."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The baker shook his head, the crime which I have committed now or has just passed on me of justice and you can only deliver me from it by blessing me frequently as you have just done come with candor said the presider.<|im_end|>", -0.018306119367480278, -0.4109950661659241, "The beggar shook his head. 
The crime which I have committed, my lord, has no call upon human justice. And you can only deliver me from it by blessing me frequently, as you have just done. Come be candid, said the coadjutor."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The baker shook his head, the crime which I have committed now won't hold you call upon human justice, and you can only deliver me from it by blessing this secret way as you have just done. Come with candor said the persecutor.<|im_end|>", 0.11918030679225922, 0.26970887184143066, "The beggar shook his head. The crime which I have committed, my lord, has no call upon human justice. And you can only deliver me from it by blessing me frequently, as you have just done. Come be candid, said the coadjutor."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The baker shook his head. The crime which I have committed, my lord has no cause of human justice, and you can only deliver me from it by blessing me frequently as you have just done come with candor said the presider.<|im_end|>", 0.3861045837402344, 1.591267704963684, "The beggar shook his head. The crime which I have committed, my lord, has no call upon human justice. And you can only deliver me from it by blessing me frequently, as you have just done. Come be candid, said the coadjutor."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The beggar shook his head, the crime which I have committed now or has been called upon me by justice, and you can only deliver me from it by blessing me secretly as you have just done come with candor said the porter to juno.<|im_end|>", 0.011092587374150753, -0.2654402256011963, "The beggar shook his head. The crime which I have committed, my lord, has no call upon human justice. 
And you can only deliver me from it by blessing me frequently, as you have just done. Come be candid, said the coadjutor."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The beggar shook his head, the crime which I have committed now would have no place among you in justice, and you can only deliver me from it by blessing me frequently as you have just done come with candids said the porter turtle.<|im_end|>", -0.0024881232529878616, -0.3326791822910309, "The beggar shook his head. The crime which I have committed, my lord, has no call upon human justice. And you can only deliver me from it by blessing me frequently, as you have just done. Come be candid, said the coadjutor."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The beggar shook his head, the crime which I have committed, my lord has no palliation in justice, and you can only deliver me from it by blessing me frequently as you have just done. Come with candor said the procurator.<|im_end|>", 0.3988274335861206, 1.6542593240737915, "The beggar shook his head. The crime which I have committed, my lord, has no call upon human justice. And you can only deliver me from it by blessing me frequently, as you have just done. Come be candid, said the coadjutor."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The beggar shook his head, the crime which I have committed, my lord, has no place among you in justice, and you can only deliver me from it by blessing me secretly as you have just done come with candids said the presbyter.<|im_end|>", 0.32486215233802795, 1.2880525588989258, "The beggar shook his head. The crime which I have committed, my lord, has no call upon human justice. And you can only deliver me from it by blessing me frequently, as you have just done. 
Come be candid, said the coadjutor."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The beggar shook his head, decline which I have permitted my lord has no cause for any injustice and you can only deliver me from it by blessing us equally as you have just done come but hand it to the procurator.<|im_end|>", -0.07866184413433075, -0.709820032119751, "The beggar shook his head. The crime which I have committed, my lord, has no call upon human justice. And you can only deliver me from it by blessing me frequently, as you have just done. Come be candid, said the coadjutor."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>What was Hamphill's great and enduring jubilation with the emotions that stirred within him when he first bushwhacked his seeming grey matter? It was stirred the remembrance that Pontiac had warned them that women were robbing the house you mean a woman.<|im_end|>", -0.49033617973327637, 0.36183518171310425, "the buttons on phelan's coat were fairly undulating with the emotions that stirred within him in his seething gray matter there stirred the remembrance that bateato had told him that women were robbing the house you mean the women"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>What was Hamphair's great concern, accumulating with the emotions that stirred within him when he first bushwhacked his seemingly gray matter? 
There stirred the remembrance that but a few moments ago, that women were robbing the house you mean the women.<|im_end|>", -0.30832746624946594, 0.963458776473999, "the buttons on phelan's coat were fairly undulating with the emotions that stirred within him in his seething gray matter there stirred the remembrance that bateato had told him that women were robbing the house you mean the women"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>So she did button some papers away and started accumulating with the emotions that stirred within one night for a first bushwacker in his seeming gray matter there stirred the remembrance that monte agello had told them women were robbing the house you mean the sheriff<|im_end|>", -0.4897034466266632, 0.3639266788959503, "the buttons on phelan's coat were fairly undulating with the emotions that stirred within him in his seething gray matter there stirred the remembrance that bateato had told him that women were robbing the house you mean the women"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The buttons of phaeton's coat were accumulating with the emotions that stirred within one at first bushwick in his seeming gray matter there stirred the remembrance that monteagle had told them women were riding the house you mean a woman<|im_end|>", 0.051824573427438736, 2.1539289951324463, "the buttons on phelan's coat were fairly undulating with the emotions that stirred within him in his seething gray matter there stirred the remembrance that bateato had told him that women were robbing the house you mean the women"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>But in some paler, gray and dreary, accumulating with the emotions that stirred within one like hers bushwick's eyes did seem in grey matter 
there stirred the remembrance that batty apples had been at Quinn's for riding the house you mean the sheriff?<|im_end|>", -0.8388098478317261, -0.7900326251983643, "the buttons on phelan's coat were fairly undulating with the emotions that stirred within him in his seething gray matter there stirred the remembrance that bateato had told him that women were robbing the house you mean the women"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>She caught some faint expression of fear, mingling with the emotions that stirred within her when she first beheld this hideous beast. His seeming gray matter evoked the remembrance that battyappo had told them women were rotting in the house you mean a woman?<|im_end|>", -0.7576847672462463, -0.5218764543533325, "the buttons on phelan's coat were fairly undulating with the emotions that stirred within him in his seething gray matter there stirred the remembrance that bateato had told him that women were robbing the house you mean the women"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>But some feelings which were accumulating with the emotions that stirred within one's heart for a perverse bushman did seem in gray matter to stir the remembrance that botany had reported that women were riding the house you mean, of women.<|im_end|>", -0.6848458051681519, -0.2811097204685211, "the buttons on phelan's coat were fairly undulating with the emotions that stirred within him in his seething gray matter there stirred the remembrance that bateato had told him that women were robbing the house you mean the women"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>What had some feelings greatly intermingling with the emotions that stirred within one at first bushwick and his seemingly gray matter there stirred 
the remembrance that but a few weeks ago, when women were rioting in the house you mean the sheriff<|im_end|>", -0.537434458732605, 0.20615343749523163, "the buttons on phelan's coat were fairly undulating with the emotions that stirred within him in his seething gray matter there stirred the remembrance that bateato had told him that women were robbing the house you mean the women"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>So she did buttons of phaeton's face was very stimulating with the emotions that stirred within one like her own it seemed in gray matter there stirred the remembrance that but a half hour ago, that women were riding the house you mean the women.<|im_end|>", -0.5774927735328674, 0.07374204695224762, "the buttons on phelan's coat were fairly undulating with the emotions that stirred within him in his seething gray matter there stirred the remembrance that bateato had told him that women were robbing the house you mean the women"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>She thought some palates of bacon, and very stimulating with the emotions that stirred within one heart for the first bushwacker in his seeming gray matter there stirred the remembrance that but a little before that women were riding the house you mean a woman.<|im_end|>", -0.5789588689804077, 0.06889592111110687, "the buttons on phelan's coat were fairly undulating with the emotions that stirred within him in his seething gray matter there stirred the remembrance that bateato had told him that women were robbing the house you mean the women"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>To shiver buttons had failed to wake him and he was still accumulating with the emotions that stirred within him when they first met in his seemingly grey 
matter there stirred the remembrance that but a few weeks before women were riding the house you mean the ship?<|im_end|>", -0.8068899512290955, -0.6845225095748901, "the buttons on phelan's coat were fairly undulating with the emotions that stirred within him in his seething gray matter there stirred the remembrance that bateato had told him that women were robbing the house you mean the women"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>So she heard buttons, having failed to wake him, began accumulating with the emotions that stirred within her when he first pushed me aside in his seemingly grave manner and restored the remembrance that battyata was one of them who were riding the house you mean a servant.<|im_end|>", -1.1789628267288208, -1.9143966436386108, "the buttons on phelan's coat were fairly undulating with the emotions that stirred within him in his seething gray matter there stirred the remembrance that bateato had told him that women were robbing the house you mean the women"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They set up the side show early in the morning before the first guest arrived at park.<|im_end|>", 0.5806475877761841, -0.7072128057479858, "They set up the sideshow early in the morning before the first guests arrived at park."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They set up the side show early in the morning before the first guests arrived at park.<|im_end|>", 0.7450000047683716, 0.4686703085899353, "They set up the sideshow early in the morning before the first guests arrived at park."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They set up the side show early in the morning before the first guests arrived 
at park.<|im_end|>", 0.7450000047683716, 0.4686703085899353, "They set up the sideshow early in the morning before the first guests arrived at park."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They set up the side show early in the morning before the first guest arrived at park.<|im_end|>", 0.5806475877761841, -0.7072128057479858, "They set up the sideshow early in the morning before the first guests arrived at park."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They set up the side show early in the morning before the first guest arrived at park.<|im_end|>", 0.5806475877761841, -0.7072128057479858, "They set up the sideshow early in the morning before the first guests arrived at park."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They set up the side show early in the morning before the first guest arrived at park.<|im_end|>", 0.5806475877761841, -0.7072128057479858, "They set up the sideshow early in the morning before the first guests arrived at park."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They set up the side show early in the morning before the first guest arrived at park.<|im_end|>", 0.5806475877761841, -0.7072128057479858, "They set up the sideshow early in the morning before the first guests arrived at park."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They set up the side show early in the morning before the first guests arrived at park.<|im_end|>", 0.7450000047683716, 0.4686703085899353, "They set up the sideshow early in the morning before the first guests arrived at park."], ["10", 
"<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They set up the sideshow early in the morning before the first guest arrived at park.<|im_end|>", 0.8543975949287415, 1.251371145248413, "They set up the sideshow early in the morning before the first guests arrived at park."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They set up the side show early in the morning before the first guest arrived at park.<|im_end|>", 0.5806475877761841, -0.7072128057479858, "They set up the sideshow early in the morning before the first guests arrived at park."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They set up the sideshow early in the morning before the first guests arrived at park.<|im_end|>", 1.0, 2.293104648590088, "They set up the sideshow early in the morning before the first guests arrived at park."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They set up the side show early in the morning before the first guest arrived at park.<|im_end|>", 0.5806475877761841, -0.7072128057479858, "They set up the sideshow early in the morning before the first guests arrived at park."]]}
|
wandb/run-20260417_123237-3h84yfea/files/media/table/completions_7_4930391b310cfe338705.table.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"columns": ["step", "prompt", "completion", "ASRWerSubLenCmpHalluDirtyV56", "advantages", "solution"], "data": [["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>darted furious glances at one another what they meant certainly which looked well for us all got out a long box and sawn it in severe weather well every ship drew upon side five on the other with a pit between us<|im_end|>", -0.711168646812439, -1.6506024599075317, "darting furious glances behind them one thing i observed which looked well for us they all got out upon the opposite side from silver well there we stood two on one side five on the other the pit between us"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Darling, furious glances were coming from her one thing I am certain which looked well for us all got out along tops and sides of this hill well there we stood two on one side five on the other with a pit between us<|im_end|>", -0.056266773492097855, 0.6078363656997681, "darting furious glances behind them one thing i observed which looked well for us they all got out upon the opposite side from silver well there we stood two on one side five on the other the pit between us"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>darted furious glances in our direction. One thing I am certain, which looked well for us, we all got out upon puffs and sighs of superiority. 
Well, every stroke two on one side five on the other was a pity to me as.<|im_end|>", -0.5369827151298523, -1.0499197244644165, "darting furious glances behind them one thing i observed which looked well for us they all got out upon the opposite side from silver well there we stood two on one side five on the other the pit between us"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>darted furious glances about one thing I am certain which looked well for us all got out of our cloaks and stockings well every ship drew upon side five on the other to pick each others<|im_end|>", -0.4635177254676819, -0.796574592590332, "darting furious glances behind them one thing i observed which looked well for us they all got out upon the opposite side from silver well there we stood two on one side five on the other the pit between us"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>darting furious glances at one another, one thing i am certain which looked well for us we all got out on the opposite side and disappeared. 
Well, there we stood two upon one side five on the other in a pit between us.<|im_end|>", 0.12982679903507233, 1.2495828866958618, "darting furious glances behind them one thing i observed which looked well for us they all got out upon the opposite side from silver well there we stood two on one side five on the other the pit between us"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>darted furious glances about one thing I am certain which looked well for us we all got out upon blocks and sides of the sewer well there we stood two on one side five on the other with a pit between us<|im_end|>", 0.13510093092918396, 1.267770767211914, "darting furious glances behind them one thing i observed which looked well for us they all got out upon the opposite side from silver well there we stood two on one side five on the other the pit between us"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Darling furious and lenses were out of order one thing I am certain which looked well for us we all got out upon tops and sides in the severe weather well there we stood two on one side five on the other the pit between us<|im_end|>", -0.07753195613622665, 0.5345030426979065, "darting furious glances behind them one thing i observed which looked well for us they all got out upon the opposite side from silver well there we stood two on one side five on the other the pit between us"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>darted furious glances about one thing I am certain which looked well for us all got out of our cloths and stockings and stood up well every ship two on one side five on the other with a pit between us<|im_end|>", -0.21955648064613342, 0.04472939670085907, "darting furious glances behind them one thing i observed which looked well 
for us they all got out upon the opposite side from silver well there we stood two on one side five on the other the pit between us"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Darling, furious and wenceslas had been there. One thing I am certain which looked well for us all got out upon foxes' side. It was clear enough. Well, every ship drew one side five on the other to pit between us.<|im_end|>", -0.45566949248313904, -0.7695098519325256, "darting furious glances behind them one thing i observed which looked well for us they all got out upon the opposite side from silver well there we stood two on one side five on the other the pit between us"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>darting furious glances about one thing I am certain, which looked well for us, they all got out of our plots and sawdust in a secure way well every stroke drew upon one side five on the other the pit being full as<|im_end|>", -0.4559590816497803, -0.7705084681510925, "darting furious glances behind them one thing i observed which looked well for us they all got out upon the opposite side from silver well there we stood two on one side five on the other the pit between us"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Darting furious glances about them one thing I am certain which looked well for us all got out a long cloth and sat in the middle of it well there we stood two on one side, five on the other with a picnic box<|im_end|>", -0.2022235095500946, 0.10450240224599838, "darting furious glances behind them one thing i observed which looked well for us they all got out upon the opposite side from silver well there we stood two on one side five on the other the pit between us"], ["15", 
"<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>darted furious glances about them one thing I am certain which looked well for us all got out along tops and sides of this hill well there we stood two on one side five on the other to pick between us<|im_end|>", 0.12362368404865265, 1.2281913757324219, "darting furious glances behind them one thing i observed which looked well for us they all got out upon the opposite side from silver well there we stood two on one side five on the other the pit between us"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I would have cherished you with all my heart, said Peterloo as we might be separated to a citizen of another world. But let's converse with regard to those who have grown up in another land and who soon after arriving here are engaged in our service.<|im_end|>", -0.25535303354263306, -0.2316378802061081, "are both opposed to the formation of such views and habits as we think desirable to the citizen of the new world we answer first with regard to those who have grown up in another land and who soon after arriving here are engaged in our service"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Are both of a distinguished and noble descent in these islands, as we might be said to be citizens of every world. 
The next verse is with regard to those who have grown up in another land and who soon after arriving here are engaged in our service.<|im_end|>", -0.19704824686050415, 0.17174986004829407, "are both opposed to the formation of such views and habits as we think desirable to the citizen of the new world we answer first with regard to those who have grown up in another land and who soon after arriving here are engaged in our service"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Our brother ships should be called in such cases as these and matters, as we might consider them to a citizen of your own world, events of personal regard to those who have grown up in another land and who soon after arriving here are engaged in our service.<|im_end|>", -0.29079490900039673, -0.47684618830680847, "are both opposed to the formation of such views and habits as we think desirable to the citizen of the new world we answer first with regard to those who have grown up in another land and who soon after arriving here are engaged in our service"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Our brothers, who have gone before us into these lands, as we might consider him to be a citizen of our own world. 
The next verse with regard to those who have grown up in another land and who soon after arriving here are engaged in our service.<|im_end|>", -0.3025875687599182, -0.5584349632263184, "are both opposed to the formation of such views and habits as we think desirable to the citizen of the new world we answer first with regard to those who have grown up in another land and who soon after arriving here are engaged in our service"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Our obligations to your royal majesty extend to these premises as we might be said to have to a citizen of the old world in answer first with regard to those who have grown up in another land and who soon after arriving here are engaged in our service.<|im_end|>", -0.027638815343379974, 1.3438266515731812, "are both opposed to the formation of such views and habits as we think desirable to the citizen of the new world we answer first with regard to those who have grown up in another land and who soon after arriving here are engaged in our service"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Are both distinguished by their voluntary services to these islands, as we might be said of him who is a citizen of every world. 
The next reverse with regard to those who have grown up in another land and who soon after arriving here are engaged in our service.<|im_end|>", -0.32690533995628357, -0.7266799807548523, "are both opposed to the formation of such views and habits as we think desirable to the citizen of the new world we answer first with regard to those who have grown up in another land and who soon after arriving here are engaged in our service"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Are of a special duty of honour and respect to these inhabitants, as we might consider him to be a citizen of their own world. The next in personal regard to those who have grown up in another land, and who soon after arriving here are engaged in our service.<|im_end|>", -0.4352739751338959, -1.4764397144317627, "are both opposed to the formation of such views and habits as we think desirable to the citizen of the new world we answer first with regard to those who have grown up in another land and who soon after arriving here are engaged in our service"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Are of a just and good moral disposition, as we might conceive them to be citizens of our own world. 
They answer first with regard to those who have grown up in another land and who, soon after arriving here, are engaged in our service.<|im_end|>", -0.22580717504024506, -0.027221782132983208, "are both opposed to the formation of such views and habits as we think desirable to the citizen of the new world we answer first with regard to those who have grown up in another land and who soon after arriving here are engaged in our service"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Our brothers, who have fallen in service to these commandments as we might consider them to a citizen of our own land, and answer first with regard to those who have grown up in another land and who soon after arriving here are engaged in our service.<|im_end|>", -0.11624263226985931, 0.7308119535446167, "are both opposed to the formation of such views and habits as we think desirable to the citizen of the new world we answer first with regard to those who have grown up in another land and who soon after arriving here are engaged in our service"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Above which we have formed ourselves these premises as we might consider them to a citizen of the whole world, and answer first with regard to those who have grown up in another land and who soon after arriving here are engaged in our service.<|im_end|>", -0.029811272397637367, 1.3287962675094604, "are both opposed to the formation of such views and habits as we think desirable to the citizen of the new world we answer first with regard to those who have grown up in another land and who soon after arriving here are engaged in our service"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Our obligations to the colonies of these islands, as we might consider them to a citizen 
of our own world, increase in force with regard to those who have grown up in another land and who soon after arriving here are engaged in our service.<|im_end|>", -0.03507249057292938, 1.292396068572998, "are both opposed to the formation of such views and habits as we think desirable to the citizen of the new world we answer first with regard to those who have grown up in another land and who soon after arriving here are engaged in our service"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Our brotherhood should be formed in such a way as to these matters, as we might conceive it were to a citizen of our own country. The next verse with regard to those who have grown up in another land and who soon after arriving here are engaged in our service.<|im_end|>", -0.4199356734752655, -1.3703200817108154, "are both opposed to the formation of such views and habits as we think desirable to the citizen of the new world we answer first with regard to those who have grown up in another land and who soon after arriving here are engaged in our service"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For seeing my weakly temper, said missus clark's manager of her daughter ashamed that she helped hide the poverty of her child in all the grand qualities which she herself possessed unconsciously and which she set so high a value upon with others.<|im_end|>", 0.046360768377780914, 0.4103975296020508, "which the uneasy tenderness of missus thornton's manner to her daughter the shame with which she thought to hide the poverty of her child in all the grand qualities which she herself possessed unconsciously and which she set so high a value upon in others"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For steam, with easy tenderness said missus sloan's 
manager of her daughter ashamed that she helped hide the poverty of her child in all the grander qualities which she herself possessed unconsciously and which she set so high a value upon with others.<|im_end|>", 0.05154683068394661, 0.44836360216140747, "which the uneasy tenderness of missus thornton's manner to her daughter the shame with which she thought to hide the poverty of her child in all the grand qualities which she herself possessed unconsciously and which she set so high a value upon in others"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For seeing my really tender and sympathetic ways of managing her daughter, ashamed that she helped to hide the poverty of her child in all the grander qualities which she herself possessed unconsciously and which she set so high a value upon with others.<|im_end|>", -0.11499068140983582, -0.7708224654197693, "which the uneasy tenderness of missus thornton's manner to her daughter the shame with which she thought to hide the poverty of her child in all the grand qualities which she herself possessed unconsciously and which she set so high a value upon in others"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For Stephen, easily tender said missus holmes managed her daughter ashamed that she helped to hide the poverty of her child in all the grander qualities which she herself possessed unconsciously and which she set so high a value upon with others.<|im_end|>", 0.10173752903938293, 0.8157991170883179, "which the uneasy tenderness of missus thornton's manner to her daughter the shame with which she thought to hide the poverty of her child in all the grand qualities which she herself possessed unconsciously and which she set so high a value upon in others"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language 
English<asr_text>for she had a really tender sense of missus holmes's management of her daughter ashamed that she helped to hide the poverty of her child in all the grander qualities which she herself possessed unconsciously and which she set so high a value upon with others<|im_end|>", 0.06310267001390457, 0.5329614281654358, "which the uneasy tenderness of missus thornton's manner to her daughter the shame with which she thought to hide the poverty of her child in all the grand qualities which she herself possessed unconsciously and which she set so high a value upon in others"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For seeing my really tender, said missus clark's manner to her daughter the shame with which she helped hide the poverty of her child in all the grander qualities that she herself possessed unconsciously and which she set so high a value upon with others.<|im_end|>", 0.2842099964618683, 2.151641607284546, "which the uneasy tenderness of missus thornton's manner to her daughter the shame with which she thought to hide the poverty of her child in all the grand qualities which she herself possessed unconsciously and which she set so high a value upon in others"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For she had a really tenderness of disposition and management for her daughter, ashamed that she helped to hide the poverty of her child in all the grand qualities which she herself possessed unconsciously, and which she set so high a value upon with others.<|im_end|>", -0.01078671682626009, -0.007967192679643631, "which the uneasy tenderness of missus thornton's manner to her daughter the shame with which she thought to hide the poverty of her child in all the grand qualities which she herself possessed unconsciously and which she set so high a value upon in others"], ["15", 
"<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For she had a really tender sense of Mrs holmes's management of her daughter, ashamed that she helped to hide the poverty of her child in all the grand qualities which she herself possessed unconsciously and which she set so high a value upon with others.<|im_end|>", -0.11140192300081253, -0.7445499300956726, "which the uneasy tenderness of missus thornton's manner to her daughter the shame with which she thought to hide the poverty of her child in all the grand qualities which she herself possessed unconsciously and which she set so high a value upon in others"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For she had a really tender sense of mrs fleming's management of her daughter, ashamed that she helped to hide the poverty of her child in all the grander qualities which she herself possessed unconsciously and which she set so high a value upon with others.<|im_end|>", -0.18237683176994324, -1.2641422748565674, "which the uneasy tenderness of missus thornton's manner to her daughter the shame with which she thought to hide the poverty of her child in all the grand qualities which she herself possessed unconsciously and which she set so high a value upon in others"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For steam and breathing temperance said missus fleming's manager her daughter ashamed that she helped hide the poverty of her child in all the grander qualities which she herself possessed unconsciously at first she set so high a value upon the pleasures<|box_start|><|im_end|>", -0.16693364083766937, -1.1510859727859497, "which the uneasy tenderness of missus thornton's manner to her daughter the shame with which she thought to hide the poverty of her child in all the grand qualities 
which she herself possessed unconsciously and which she set so high a value upon in others"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For she had a pleasing temper, said missus holmes's manager of her daughter, ashamed that she helped to hide the poverty of her child in all the grander qualities which she herself possessed unconsciously and which she set so high a value upon with others.<|im_end|>", -0.12878626585006714, -0.8718170523643494, "which the uneasy tenderness of missus thornton's manner to her daughter the shame with which she thought to hide the poverty of her child in all the grand qualities which she herself possessed unconsciously and which she set so high a value upon in others"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For she had a pleasing temper, said missus holmes's manager of her daughter ashamed that she helped to hide the poverty of her child in all the grand qualities which she herself possessed unconsciously and which she set so high a value upon with others.<|im_end|>", 0.05193726718425751, 0.45122188329696655, "which the uneasy tenderness of missus thornton's manner to her daughter the shame with which she thought to hide the poverty of her child in all the grand qualities which she herself possessed unconsciously and which she set so high a value upon in others"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And had promised to enter the eternal city in my next episcopal abbatial name.<|im_end|>", -0.288534939289093, 0.34273386001586914, "And had promised to lend her the eternal city and my recipe for rabbit mayonnaise."], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And had promised to enter the eternal city in my 
nephew's behalf at mayonnaise.<|im_end|>", -0.062477611005306244, 1.5248231887817383, "And had promised to lend her the eternal city and my recipe for rabbit mayonnaise."], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And had promised to enter the eternal city in my own sepulchre, provided me a name.<|im_end|>", -0.6080390810966492, -1.3280036449432373, "And had promised to lend her the eternal city and my recipe for rabbit mayonnaise."], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And had promised to enter the eternal city and martyrship provided me a name.<|im_end|>", -0.28105244040489197, 0.38186103105545044, "And had promised to lend her the eternal city and my recipe for rabbit mayonnaise."], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And had promised to enter the eternal city in my embassy provided me a name.<|im_end|>", -0.4495788514614105, -0.4993901252746582, "And had promised to lend her the eternal city and my recipe for rabbit mayonnaise."], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And had promised to enter the eternal city in my nephew's behalf at mayonnaise.<|im_end|>", -0.062477611005306244, 1.5248231887817383, "And had promised to lend her the eternal city and my recipe for rabbit mayonnaise."], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And had promised to enter the eternal city and martyrship provided me a name.<|im_end|>", -0.28105244040489197, 0.38186103105545044, "And had promised to lend her the eternal city and my recipe for rabbit mayonnaise."], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language 
English<asr_text>And had promised to enter the eternal city in my next episcopal visit made there.<|im_end|>", -0.4480052590370178, -0.4911615550518036, "And had promised to lend her the eternal city and my recipe for rabbit mayonnaise."], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And had promised to enter the eternal city and martyrship provided me a name.<|im_end|>", -0.28105244040489197, 0.38186103105545044, "And had promised to lend her the eternal city and my recipe for rabbit mayonnaise."], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And had promised to enter the eternal city in my next epistle that it may remain.<|im_end|>", -0.6017347574234009, -1.2950372695922852, "And had promised to lend her the eternal city and my recipe for rabbit mayonnaise."], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And had promised to enter the eternal city and martyrship provided me a name.<|im_end|>", -0.28105244040489197, 0.38186103105545044, "And had promised to lend her the eternal city and my recipe for rabbit mayonnaise."], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And had promised to enter the eternal city in my nephew's behalf at many a name.<|im_end|>", -0.6038755774497986, -1.30623197555542, "And had promised to lend her the eternal city and my recipe for rabbit mayonnaise."]]}
|
wandb/run-20260417_123237-3h84yfea/files/media/table/completions_9_ec21142175e3781c9ddd.table.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"columns": ["step", "prompt", "completion", "ASRWerSubLenCmpHalluDirtyV56", "advantages", "solution"], "data": [["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>We looked upon them and we laughed, and said fear nothing my brothers, there is a great power in these wires but this power is tamed it is yours we give it to you still they would not move.<|im_end|>", 0.7686349749565125, 0.5085489153862, "we looked upon them and we laughed and said fear nothing our brothers there is a great power in these wires but this power is tamed it is yours we give it to you still they would not move"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>We looked upon them and we laughed, and said fear nothing my brothers there is a great power in these wires but this power is tamed it is yours we give it to you still they would not move.<|im_end|>", 0.8261563181877136, 0.8900229930877686, "we looked upon them and we laughed and said fear nothing our brothers there is a great power in these wires but this power is tamed it is yours we give it to you still they would not move"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>We looked upon them and we laughed, and said fear nothing my brothers, there is a great power in these wires, but this power is tamed. It is yours. 
We give it to you still they would not move.<|im_end|>", 0.5813714861869812, -0.7333583831787109, "we looked upon them and we laughed and said fear nothing our brothers there is a great power in these wires but this power is tamed it is yours we give it to you still they would not move"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>We looked upon them and we laughed, and said fear nothing my brothers there is a great power in these wires but this power is tamed it is yours we give it to you still they would not move.<|im_end|>", 0.8261563181877136, 0.8900229930877686, "we looked upon them and we laughed and said fear nothing our brothers there is a great power in these wires but this power is tamed it is yours we give it to you still they would not move"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>We looked upon them and we laughed, and said fear nothing my brothers there is a great power in these wires but this power is tamed it is yours we give it to you still they would not move.<|im_end|>", 0.8261563181877136, 0.8900229930877686, "we looked upon them and we laughed and said fear nothing our brothers there is a great power in these wires but this power is tamed it is yours we give it to you still they would not move"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>We looked upon them and we laughed, and said fear nothing my brothers, there is a great power in these wilds, but this power is tamed. It is yours. 
We give it to you still they would not move.<|im_end|>", 0.5788635611534119, -0.7499906420707703, "we looked upon them and we laughed and said fear nothing our brothers there is a great power in these wires but this power is tamed it is yours we give it to you still they would not move"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>We looked upon them and we laughed, and said, fear nothing, my brothers. There is a great power in these wires, but this power is tamed. It is yours. We give it to you still they would not move.<|im_end|>", 0.4414002299308777, -1.6616296768188477, "we looked upon them and we laughed and said fear nothing our brothers there is a great power in these wires but this power is tamed it is yours we give it to you still they would not move"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>We looked upon them and we laughed, and said, fear nothing my brothers, there is a great power in these wires but this power is tamed it is yours, we give it to you still they would not move.<|im_end|>", 0.6516913175582886, -0.26700636744499207, "we looked upon them and we laughed and said fear nothing our brothers there is a great power in these wires but this power is tamed it is yours we give it to you still they would not move"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>We looked upon them and we laughed, and said fear nothing my brothers there is a great power in these wires but this power is tamed it is yours we give it to you still they would not move.<|im_end|>", 0.8261563181877136, 0.8900229930877686, "we looked upon them and we laughed and said fear nothing our brothers there is a great power in these wires but this power is tamed it is yours we give it to you still they would not move"], ["20", 
"<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>We looked upon them and we laughed, and said fear nothing, my brothers, there is a great power in these wires but this power is tamed it is yours we give it to you still they would not move.<|im_end|>", 0.7117764949798584, 0.13147078454494476, "we looked upon them and we laughed and said fear nothing our brothers there is a great power in these wires but this power is tamed it is yours we give it to you still they would not move"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>We looked upon them and we laughed, and said fear nothing my brothers there is a great power in these wires but this power is tamed it is yours we give it to you still they would not move.<|im_end|>", 0.8261563181877136, 0.8900229930877686, "we looked upon them and we laughed and said fear nothing our brothers there is a great power in these wires but this power is tamed it is yours we give it to you still they would not move"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>We looked upon them and we laughed, and said, fear nothing, my brothers. There is a great power in these wilds, but this power is tamed. It is yours. 
We give it to you still they would not move.<|im_end|>", 0.43890881538391113, -1.6781524419784546, "we looked upon them and we laughed and said fear nothing our brothers there is a great power in these wires but this power is tamed it is yours we give it to you still they would not move"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At such a moment, this yet undiscovered and peculiar world was in no ordinary shape, setting in motion incalculable weapons of force and agencies for the first time man had command of his native supply of electricity without thought or effort.<|im_end|>", -0.12373896688222885, 0.08507958054542542, "at such a moment this gift of despoiled italy to the world was a noble revenge setting in motion incalculable beneficent forces and agencies for the first time man had command of a steady supply of electricity without toil or effort"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At such a moment, this yet undiscovered and peculiar world was in no words of change setting in motion incalculable weapons and forces and agencies for the first time man had command of his daily supply of electricity without trouble or effort.<|im_end|>", -0.1656464785337448, -0.35089585185050964, "at such a moment this gift of despoiled italy to the world was a noble revenge setting in motion incalculable beneficent forces and agencies for the first time man had command of a steady supply of electricity without toil or effort"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At such a moment, this yet undiscovered and peculiar world was in no ordinary shape, setting in motion incalculable weapons and forces and agencies for the first time man had command of his native supply of electricity without thought or effort.<|im_end|>", 
-0.054759737104177475, 0.8026895523071289, "at such a moment this gift of despoiled italy to the world was a noble revenge setting in motion incalculable beneficent forces and agencies for the first time man had command of a steady supply of electricity without toil or effort"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At such a moment, this yet undiscovered and peculiar world was in no ordinary chair setting in motion incalculable weapons of force and agencies for the first time man had command of his native supply of electricity without thought or effort.<|im_end|>", -0.12419147044420242, 0.08037205785512924, "at such a moment this gift of despoiled italy to the world was a noble revenge setting in motion incalculable beneficent forces and agencies for the first time man had command of a steady supply of electricity without toil or effort"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At such a moment, this yet undiscovered and peculiar world was in no way diminished, setting in motion incalculable weapons and forces and agencies for the first time man had command of his daily supply of electricity without thought or effort.<|im_end|>", -0.05371581390500069, 0.8135498762130737, "at such a moment this gift of despoiled italy to the world was a noble revenge setting in motion incalculable beneficent forces and agencies for the first time man had command of a steady supply of electricity without toil or effort"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At such a moment, this yet undiscovered and peculiar world was in no little danger, setting in motion incalculable weapons of force and agencies for the first time man had command over things supplied with electricity without thought or effort.<|im_end|>", -0.3379965126514435, 
-2.1439008712768555, "at such a moment this gift of despoiled italy to the world was a noble revenge setting in motion incalculable beneficent forces and agencies for the first time man had command of a steady supply of electricity without toil or effort"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At such a moment, this vehicle of the mechanical world was in no other language setting in motion incalculable weapons and forces and agencies for the first time man had command of his native supply of electricity without thought or effort.<|im_end|>", 0.018295863643288612, 1.5627073049545288, "at such a moment this gift of despoiled italy to the world was a noble revenge setting in motion incalculable beneficent forces and agencies for the first time man had command of a steady supply of electricity without toil or effort"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At such a moment, this yet undiscovered and peculiar world was in no ordinary shape, setting in motion incalculable weapons of force and agencies for the first time man had command of his native supply of electricity without thought or effort.<|im_end|>", -0.12373896688222885, 0.08507958054542542, "at such a moment this gift of despoiled italy to the world was a noble revenge setting in motion incalculable beneficent forces and agencies for the first time man had command of a steady supply of electricity without toil or effort"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At such a moment, this yet undiscovered and familiar world was in no ordinary shape, setting in motion incalculable weapons of force and agencies. 
For the first time man had command of his daily supply of electricity without trouble or effort.<|im_end|>", -0.19637031853199005, -0.6705244779586792, "at such a moment this gift of despoiled italy to the world was a noble revenge setting in motion incalculable beneficent forces and agencies for the first time man had command of a steady supply of electricity without toil or effort"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At such a moment, this yet undiscovered and familiar world was in no ordinary shape, setting in motion incalculable weapons and forces and agencies for the first time man had command of his native supply of electricity without thought or effort.<|im_end|>", -0.053767330944538116, 0.8130138516426086, "at such a moment this gift of despoiled italy to the world was a noble revenge setting in motion incalculable beneficent forces and agencies for the first time man had command of a steady supply of electricity without toil or effort"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At such a moment, this yet undiscovered and peculiar world was in no ordinary shape setting in motion incalculable weapons of force and agencies for the first time man had command of his native supply of electricity without thought or effort.<|im_end|>", -0.12297827005386353, 0.09299331903457642, "at such a moment this gift of despoiled italy to the world was a noble revenge setting in motion incalculable beneficent forces and agencies for the first time man had command of a steady supply of electricity without toil or effort"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At such a moment, this yet undiscovered and familiar world was in no word of language setting in motion incalculable weapons of force and agencies for the first time 
man had command of his native supply of electricity without thought or effort.<|im_end|>", -0.24439725279808044, -1.1701619625091553, "at such a moment this gift of despoiled italy to the world was a noble revenge setting in motion incalculable beneficent forces and agencies for the first time man had command of a steady supply of electricity without toil or effort"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He repeated and they're dashed out of the turnpike splendid span black horses attached to a carriage having long run s r s in gilt letters on the fender at the door two girls stepped up in the car with the carriage the old woman had entered and taken her seat<|im_end|>", 0.19381928443908691, 0.380490243434906, "he repeated and there dashed up to the curb a splendid span of black horses attached to a carriage having the monogram c r s in gilt letters on the panel of the door two girls stepped out of the crowd towards the carriage the older one had entered and taken her seat"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He repeated, and there dashed out of the nursery a splendid span black horses attached to a carriage having long written c r s in gilt letters on the handle of that order two girls stepped out at the car window with the carriage, the old woman had entered and taken her seat.<|im_end|>", 0.14365018904209137, -0.12923574447631836, "he repeated and there dashed up to the curb a splendid span of black horses attached to a carriage having the monogram c r s in gilt letters on the panel of the door two girls stepped out of the crowd towards the carriage the older one had entered and taken her seat"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He repeated, and there dashed after them a splendid span of black horses 
attached to a carriage having long written c r s in gilt letters on the fanlight door two girls stepped out at the front door with the carriage. The old woman had entered, taken her seat.<|im_end|>", 0.05467502027750015, -1.0332376956939697, "he repeated and there dashed up to the curb a splendid span of black horses attached to a carriage having the monogram c r s in gilt letters on the panel of the door two girls stepped out of the crowd towards the carriage the older one had entered and taken her seat"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He repeated and they're dashed out into the nursery as a splendid span of black horses attached to a carriage having long running c r s in gilt letters on the fender at the door two girls stepped out of the car with the carriage, the old woman had entered and taken her seat.<|im_end|>", 0.294100284576416, 1.399361252784729, "he repeated and there dashed up to the curb a splendid span of black horses attached to a carriage having the monogram c r s in gilt letters on the panel of the door two girls stepped out of the crowd towards the carriage the older one had entered and taken her seat"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He repeated and they're dashed out of the nursery a splendid span black horses attached to a carriage having long running c r s in gilt letters on the front of that order two girls stepped up into the crowded rear of the carriage, the old woman had entered taking her seat.<|im_end|>", -0.00651371106505394, -1.654924988746643, "he repeated and there dashed up to the curb a splendid span of black horses attached to a carriage having the monogram c r s in gilt letters on the panel of the door two girls stepped out of the crowd towards the carriage the older one had entered and taken her seat"], ["20", 
"<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He repeated, and there dashed out through the nursery a splendid span of black horses attached to a carriage having long red c r s in gilt letters on the handle at the door. Two girls stepped up to the carriageway with the carriage. The old woman had entered and taken her seat.<|im_end|>", 0.1829727590084076, 0.2702878415584564, "he repeated and there dashed up to the curb a splendid span of black horses attached to a carriage having the monogram c r s in gilt letters on the panel of the door two girls stepped out of the crowd towards the carriage the older one had entered and taken her seat"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He repeated, and they're dashed up through the turnpike splendid span of black horses attached to a carriage having long running c r s in gilt letters on the fan of that order two girls stepped out into the crowd towards the carriage, the old woman had entered and taken her seat.<|im_end|>", 0.2951398491859436, 1.4099233150482178, "he repeated and there dashed up to the curb a splendid span of black horses attached to a carriage having the monogram c r s in gilt letters on the panel of the door two girls stepped out of the crowd towards the carriage the older one had entered and taken her seat"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He repeated and they're dashed out into the nursery, a splendid span of black horses attached to a carriage having long running c r s in gilt letters on the fender at the door. Two girls stepped out in the corral towards the carriage. 
The old woman had entered and taken her seat.<|im_end|>", 0.28599315881729126, 1.3169915676116943, "he repeated and there dashed up to the curb a splendid span of black horses attached to a carriage having the monogram c r s in gilt letters on the panel of the door two girls stepped out of the crowd towards the carriage the older one had entered and taken her seat"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He repeated, and there dashed out of the nursery a splendid span of black horses attached to a carriage having long running s r s in gilt letters on the front of that order two girls stepped up into the rear end of the carriage, the old woman had entered and taken her seat.<|im_end|>", 0.08877895027399063, -0.6867362856864929, "he repeated and there dashed up to the curb a splendid span of black horses attached to a carriage having the monogram c r s in gilt letters on the panel of the door two girls stepped out of the crowd towards the carriage the older one had entered and taken her seat"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He repeated, and there dashed out of the nursery a splendid span black horses attached to a carriage having on the bonnet c r s in gilt letters on a fan flap door two girls stepped up to the crowd around the carriage. 
The old woman had entered and taken her seat.<|im_end|>", 0.15423451364040375, -0.021697325631976128, "he repeated and there dashed up to the curb a splendid span of black horses attached to a carriage having the monogram c r s in gilt letters on the panel of the door two girls stepped out of the crowd towards the carriage the older one had entered and taken her seat"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He repeated and they're dashed out of the nursery with a splendid span of black horses attached to a carriage having long running c r s in gilt letters on the front of that order two girls stepped up at the garaband door of the carriage, the old woman had entered and taken her seat.<|im_end|>", 0.09735386073589325, -0.5996138453483582, "he repeated and there dashed up to the curb a splendid span of black horses attached to a carriage having the monogram c r s in gilt letters on the panel of the door two girls stepped out of the crowd towards the carriage the older one had entered and taken her seat"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He repeated and they're dashed out of the nursery, splendid span black horses attached to a carriage having long running c r s in gilt letters on the fan flap door two girls stepped up into the carriagewith the old woman had entered and taken her seat<|im_end|>", 0.09223616868257523, -0.6516103744506836, "he repeated and there dashed up to the curb a splendid span of black horses attached to a carriage having the monogram c r s in gilt letters on the panel of the door two girls stepped out of the crowd towards the carriage the older one had entered and taken her seat"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The young inventor turned his face aside and then glanced round the 
dark barn in alarm. The cat pushed out from behind him with a great low paw between its jaws, and it was ugly. Sh sh said a low murmur of whisper.<|im_end|>", -1.1028889417648315, -0.7121061682701111, "They looked into each other's frightened faces, and then glanced around the dark barn in alarm. An old cap pushed up through the hay. Then a weak little cough betrayed jonesy. He had followed them. Sh he said in a warning whisper."], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And looked into each other's frightened faces, and then glanced round the dark barn in alarm. He pushed up his collar with a great low cough between jerks of breath, and held out his hand. Sh sh said an old woman whispering.<|im_end|>", -0.6284806728363037, 1.885280966758728, "They looked into each other's frightened faces, and then glanced around the dark barn in alarm. An old cap pushed up through the hay. Then a weak little cough betrayed jonesy. He had followed them. Sh he said in a warning whisper."], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Then he leaned over to his sister, and they kissed again, and then glanced round the dark barn in the mar. Cuthbert's head fell, and a great blow passed between them. And it was heavy, sh she said aloud with a whisper.<|im_end|>", -1.1564602851867676, -1.0054094791412354, "They looked into each other's frightened faces, and then glanced around the dark barn in alarm. An old cap pushed up through the hay. Then a weak little cough betrayed jonesy. He had followed them. Sh he said in a warning whisper."], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The little angel just stared at his feet, and then glanced round the dark barn in alarm. 
He pushed up his heels with a great blow, caught betwixt arm and leg, and had hardly been shuffling on the floor when he whispered.<|im_end|>", -1.1646636724472046, -1.0503231287002563, "They looked into each other's frightened faces, and then glanced around the dark barn in alarm. An old cap pushed up through the hay. Then a weak little cough betrayed jonesy. He had followed them. Sh he said in a warning whisper."], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The little angel touched his great white face and then glanced round the dark barn in alarm, pushed up from under it with a great blow of paws that dragged him back again. And he had said something sh she flamed out a whisper.<|im_end|>", -1.1615231037139893, -1.0331284999847412, "They looked into each other's frightened faces, and then glanced around the dark barn in alarm. An old cap pushed up through the hay. Then a weak little cough betrayed jonesy. He had followed them. Sh he said in a warning whisper."], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Then he looked into each of the three faces and then glanced round the dark barn in alarm, pushed out his head and with great little hops retreated joyfully away from the room sh she said a murmur whispered.<|im_end|>", -0.9255474805831909, 0.2588390111923218, "They looked into each other's frightened faces, and then glanced around the dark barn in alarm. An old cap pushed up through the hay. Then a weak little cough betrayed jonesy. He had followed them. Sh he said in a warning whisper."], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The little angel just stared at his hand and then glanced round the dark barn in alarm, pushed up her hood and a great low cough betrayed joy and fear. 
Sh sh sh said another voice.<|im_end|>", -0.9503790140151978, 0.12288626283407211, "They looked into each other's frightened faces, and then glanced around the dark barn in alarm. An old cap pushed up through the hay. Then a weak little cough betrayed jonesy. He had followed them. Sh he said in a warning whisper."], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And looked into each other's frightened faces, and then glanced round the dark barn in alarm. Pritchett quickly hid his great blue paws between his arms, and he did a little bit sh sh said a low voice.<|im_end|>", -0.6836804151535034, 1.5830621719360352, "They looked into each other's frightened faces, and then glanced around the dark barn in alarm. An old cap pushed up through the hay. Then a weak little cough betrayed jonesy. He had followed them. Sh he said in a warning whisper."], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And looking down at his frightened face, and then glanced round the dark barn in alarm. He pushed up slowly from a great low cask between two walls and looked wildly around him. Sh said another voice.<|im_end|>", -0.9896582961082458, -0.09216795861721039, "They looked into each other's frightened faces, and then glanced around the dark barn in alarm. An old cap pushed up through the hay. Then a weak little cough betrayed jonesy. He had followed them. Sh he said in a warning whisper."], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The little angel just stared at her and then glanced round the dark barn in alarm, but pushed up quickly when a great blow passed between the two men. 
And it was somebody sh said another voice.<|im_end|>", -1.0897308588027954, -0.640065610408783, "They looked into each other's frightened faces, and then glanced around the dark barn in alarm. An old cap pushed up through the hay. Then a weak little cough betrayed jonesy. He had followed them. Sh he said in a warning whisper."], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And looked into each of the great windows, and then glanced round the dark barn in the yard. He pushed up his sleeve, and with a great low cough betrayed joy, and asked happily shh, said another voice quietly.<|im_end|>", -0.8186123371124268, 0.8443093299865723, "They looked into each other's frightened faces, and then glanced around the dark barn in alarm. An old cap pushed up through the hay. Then a weak little cough betrayed jonesy. He had followed them. Sh he said in a warning whisper."], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And looking down at his frightened face again, and then glanced round the dark barn in alarm. He pushed up slowly from the great low cask between two old men. And he saw a blue moon sh she said no one whispered.<|im_end|>", -1.0022618770599365, -0.16117261350154877, "They looked into each other's frightened faces, and then glanced around the dark barn in alarm. An old cap pushed up through the hay. Then a weak little cough betrayed jonesy. He had followed them. Sh he said in a warning whisper."]]}
|
wandb/run-20260417_123237-3h84yfea/files/output.log
ADDED
|
@@ -0,0 +1,326 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
wandb: Detected [openai] in use.
|
| 2 |
+
wandb: Use W&B Weave for improved LLM call tracing. Install Weave with `pip install weave` then add `import weave` to the top of your script.
|
| 3 |
+
wandb: For more information, check out the docs at: https://weave-docs.wandb.ai/
|
| 4 |
+
Train: 0%| | 0/9327 [00:00<?, ?it/s]Could not estimate the number of tokens of the input, floating-point operations will not be computed
|
| 5 |
+
[DEBUG generate] shape= (24, 245) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 6 |
+
[DEBUG _encode] has_resp= True prompt_len= 245 resp_len= 53 full_len= 298 label_non_ignore= 53
|
| 7 |
+
[DEBUG _encode] has_resp= True prompt_len= 245 resp_len= 56 full_len= 301 label_non_ignore= 56
|
| 8 |
+
[DEBUG _encode] has_resp= True prompt_len= 245 resp_len= 52 full_len= 297 label_non_ignore= 52
|
| 9 |
+
[DEBUG _encode] has_resp= True prompt_len= 245 resp_len= 53 full_len= 298 label_non_ignore= 53
|
| 10 |
+
[DEBUG _encode] has_resp= True prompt_len= 245 resp_len= 58 full_len= 303 label_non_ignore= 58
|
| 11 |
+
[DEBUG _encode] has_resp= True prompt_len= 245 resp_len= 55 full_len= 300 label_non_ignore= 55
|
| 12 |
+
[DEBUG _encode] has_resp= True prompt_len= 245 resp_len= 56 full_len= 301 label_non_ignore= 56
|
| 13 |
+
[DEBUG _encode] has_resp= True prompt_len= 245 resp_len= 61 full_len= 306 label_non_ignore= 61
|
| 14 |
+
[DEBUG _encode] has_resp= True prompt_len= 245 resp_len= 55 full_len= 300 label_non_ignore= 55
|
| 15 |
+
[DEBUG _encode] has_resp= True prompt_len= 245 resp_len= 50 full_len= 295 label_non_ignore= 50
|
| 16 |
+
[DEBUG generate] shape= (24, 245) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 17 |
+
[DEBUG generate] shape= (24, 235) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 18 |
+
[DEBUG generate] shape= (24, 235) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 19 |
+
[DEBUG generate] shape= (24, 249) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 20 |
+
Train: 0%| | 8/9327 [07:40<146:43:24, 56.68s/it]
|
| 21 |
+
{'loss': 0.00064715, 'grad_norm': 0.43327886, 'learning_rate': 1.8e-07, 'completions/mean_length': 48.90104294, 'completions/min_length': 35.25, 'completions/max_length': 61.25, 'completions/clipped_ratio': 0.0, 'reward': -0.42871299, 'reward_std': 0.16135792, 'frac_reward_zero_std': 0.0, 'rewards/ASRWerSubLenCmpHalluDirtyV56/mean': -0.42871299, 'rewards/ASRWerSubLenCmpHalluDirtyV56/std': 0.28526043, 'kl': 0.0, 'clip_ratio/low_mean': 0.0, 'clip_ratio/low_min': 0.0, 'clip_ratio/high_mean': 0.0, 'clip_ratio/high_max': 0.0, 'clip_ratio/region_mean': 0.0, 'step_time': 32.50056268, 'epoch': 0.0, 'global_step/max_steps': '1/9327', 'elapsed_time': '1m 5s', 'remaining_time': '7d 1h 23m 55s', 'memory(GiB)': 7.93, 'train_speed(s/it)': 65.390893}
|
| 22 |
+
[DEBUG generate] shape= (24, 250) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 23 |
+
[DEBUG generate] shape= (24, 250) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 24 |
+
[DEBUG generate] shape= (24, 226) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 25 |
+
[DEBUG generate] shape= (24, 226) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 26 |
+
[DEBUG generate] shape= (24, 249) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 27 |
+
[DEBUG generate] shape= (24, 249) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 28 |
+
[DEBUG generate] shape= (24, 255) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 29 |
+
[DEBUG generate] shape= (24, 255) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 30 |
+
[DEBUG generate] shape= (24, 257) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 31 |
+
[DEBUG generate] shape= (24, 257) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 32 |
+
[DEBUG generate] shape= (24, 244) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 33 |
+
[DEBUG generate] shape= (24, 244) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 34 |
+
[DEBUG generate] shape= (24, 253) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 35 |
+
[DEBUG generate] shape= (24, 253) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 36 |
+
[DEBUG generate] shape= (24, 254) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 37 |
+
[DEBUG generate] shape= (24, 254) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 38 |
+
{'loss': 0.00332408, 'grad_norm': 0.37274894, 'learning_rate': 8.9e-07, 'completions/mean_length': 51.19921994, 'completions/min_length': 34.0, 'completions/max_length': 64.6875, 'completions/clipped_ratio': 0.0, 'reward': -0.02796031, 'reward_std': 0.15601904, 'frac_reward_zero_std': 0.0, 'rewards/ASRWerSubLenCmpHalluDirtyV56/mean': -0.02796032, 'rewards/ASRWerSubLenCmpHalluDirtyV56/std': 0.3970435, 'kl': 0.00452624, 'clip_ratio/low_mean': 0.01082122, 'clip_ratio/low_min': 0.0055485, 'clip_ratio/high_mean': 0.00634016, 'clip_ratio/high_max': 0.0085038, 'clip_ratio/region_mean': 0.01716138, 'step_time': 27.27283109, 'epoch': 0.0, 'global_step/max_steps': '5/9327', 'elapsed_time': '4m 49s', 'remaining_time': '6d 5h 27m 51s', 'memory(GiB)': 8.23, 'train_speed(s/it)': 57.720515}
|
| 39 |
+
[DEBUG generate] shape= (24, 256) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 40 |
+
[DEBUG generate] shape= (24, 256) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 41 |
+
[DEBUG generate] shape= (24, 246) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 42 |
+
[DEBUG generate] shape= (24, 246) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 43 |
+
[DEBUG generate] shape= (24, 135) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 44 |
+
[DEBUG generate] shape= (24, 135) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 45 |
+
[DEBUG generate] shape= (24, 225) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 46 |
+
[DEBUG generate] shape= (24, 225) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 47 |
+
[DEBUG generate] shape= (24, 244) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 48 |
+
[DEBUG generate] shape= (24, 244) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 49 |
+
[DEBUG generate] shape= (24, 240) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 50 |
+
[DEBUG generate] shape= (24, 240) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 51 |
+
[DEBUG generate] shape= (24, 244) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 52 |
+
[DEBUG generate] shape= (24, 244) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 53 |
+
[DEBUG generate] shape= (24, 246) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 54 |
+
[DEBUG generate] shape= (24, 246) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 55 |
+
[DEBUG generate] shape= (24, 236) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 56 |
+
[DEBUG generate] shape= (24, 236) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 57 |
+
[DEBUG generate] shape= (24, 238) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 58 |
+
[DEBUG generate] shape= (24, 238) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 59 |
+
{'loss': 0.00474931, 'grad_norm': 0.40048897, 'learning_rate': 1.79e-06, 'completions/mean_length': 51.25104275, 'completions/min_length': 35.8, 'completions/max_length': 65.4, 'completions/clipped_ratio': 0.0, 'reward': -0.01675091, 'reward_std': 0.17052342, 'frac_reward_zero_std': 0.0, 'rewards/ASRWerSubLenCmpHalluDirtyV56/mean': -0.0167509, 'rewards/ASRWerSubLenCmpHalluDirtyV56/std': 0.47662268, 'kl': 0.00584314, 'clip_ratio/low_mean': 0.0141277, 'clip_ratio/low_min': 0.0085519, 'clip_ratio/high_mean': 0.00913547, 'clip_ratio/high_max': 0.01304741, 'clip_ratio/region_mean': 0.02326317, 'step_time': 27.57334645, 'epoch': 0.0, 'global_step/max_steps': '10/9327', 'elapsed_time': '9m 28s', 'remaining_time': '6d 2h 53m 31s', 'memory(GiB)': 8.23, 'train_speed(s/it)': 56.757666}
|
| 60 |
+
[DEBUG generate] shape= (24, 242) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 61 |
+
[DEBUG generate] shape= (24, 242) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 62 |
+
[DEBUG generate] shape= (24, 241) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 63 |
+
[DEBUG generate] shape= (24, 241) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 64 |
+
[DEBUG generate] shape= (24, 245) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 65 |
+
[DEBUG generate] shape= (24, 245) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 66 |
+
[DEBUG generate] shape= (24, 246) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 67 |
+
[DEBUG generate] shape= (24, 246) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 68 |
+
[DEBUG generate] shape= (24, 257) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 69 |
+
[DEBUG generate] shape= (24, 257) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 70 |
+
[DEBUG generate] shape= (24, 252) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 71 |
+
[DEBUG generate] shape= (24, 252) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 72 |
+
[DEBUG generate] shape= (24, 248) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 73 |
+
[DEBUG generate] shape= (24, 248) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 74 |
+
[DEBUG generate] shape= (24, 239) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 75 |
+
[DEBUG generate] shape= (24, 239) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 76 |
+
[DEBUG generate] shape= (24, 247) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 77 |
+
[DEBUG generate] shape= (24, 247) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 78 |
+
[DEBUG generate] shape= (24, 246) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 79 |
+
[DEBUG generate] shape= (24, 246) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 80 |
+
{'loss': 0.00394418, 'grad_norm': 0.42660096, 'learning_rate': 2.68e-06, 'completions/mean_length': 49.16666756, 'completions/min_length': 35.4, 'completions/max_length': 62.85, 'completions/clipped_ratio': 0.0, 'reward': 0.02952445, 'reward_std': 0.14753249, 'frac_reward_zero_std': 0.0, 'rewards/ASRWerSubLenCmpHalluDirtyV56/mean': 0.02952445, 'rewards/ASRWerSubLenCmpHalluDirtyV56/std': 0.38754931, 'kl': 0.00462258, 'clip_ratio/low_mean': 0.01453043, 'clip_ratio/low_min': 0.00974138, 'clip_ratio/high_mean': 0.00804176, 'clip_ratio/high_max': 0.01153084, 'clip_ratio/region_mean': 0.0225722, 'step_time': 26.1855211, 'epoch': 0.0, 'global_step/max_steps': '15/9327', 'elapsed_time': '13m 52s', 'remaining_time': '5d 23h 33m 19s', 'memory(GiB)': 8.25, 'train_speed(s/it)': 55.498132}
|
| 81 |
+
[DEBUG generate] shape= (24, 244) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 82 |
+
[DEBUG generate] shape= (24, 244) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 83 |
+
[DEBUG generate] shape= (24, 253) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 84 |
+
[DEBUG generate] shape= (24, 253) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 85 |
+
[DEBUG generate] shape= (24, 244) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 86 |
+
[DEBUG generate] shape= (24, 244) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 87 |
+
[DEBUG generate] shape= (24, 277) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 88 |
+
[DEBUG generate] shape= (24, 277) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 89 |
+
[DEBUG generate] shape= (24, 236) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 90 |
+
[DEBUG generate] shape= (24, 236) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 91 |
+
[DEBUG generate] shape= (24, 252) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 92 |
+
[DEBUG generate] shape= (24, 252) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 93 |
+
[DEBUG generate] shape= (24, 157) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 94 |
+
[DEBUG generate] shape= (24, 157) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 95 |
+
[DEBUG generate] shape= (24, 252) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 96 |
+
[DEBUG generate] shape= (24, 252) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 97 |
+
[DEBUG generate] shape= (24, 239) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 98 |
+
[DEBUG generate] shape= (24, 239) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 99 |
+
[DEBUG generate] shape= (24, 251) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 100 |
+
[DEBUG generate] shape= (24, 251) last_col_pad_cnt= 0 first_col_pad_cnt= 12
|
| 101 |
+
{'loss': 0.00318602, 'grad_norm': 0.90874422, 'learning_rate': 3.57e-06, 'completions/mean_length': 48.42812653, 'completions/min_length': 30.25, 'completions/max_length': 61.4, 'completions/clipped_ratio': 0.0, 'reward': 0.02232184, 'reward_std': 0.16092061, 'frac_reward_zero_std': 0.0, 'rewards/ASRWerSubLenCmpHalluDirtyV56/mean': 0.02232184, 'rewards/ASRWerSubLenCmpHalluDirtyV56/std': 0.42085464, 'kl': 0.00529333, 'clip_ratio/low_mean': 0.01409527, 'clip_ratio/low_min': 0.00800156, 'clip_ratio/high_mean': 0.00843188, 'clip_ratio/high_max': 0.01220032, 'clip_ratio/region_mean': 0.02252715, 'step_time': 25.72940668, 'epoch': 0.01, 'global_step/max_steps': '20/9327', 'elapsed_time': '18m 13s', 'remaining_time': '5d 21h 15m 45s', 'memory(GiB)': 8.38, 'train_speed(s/it)': 54.641181}
|
| 102 |
+
[DEBUG generate] shape= (8, 245) last_col_pad_cnt= 0 first_col_pad_cnt= 4
|
| 103 |
+
Val: 4%|▍ | 2/53 [00:05<02:08, 2.53s/it][INFO:swift] last_model_checkpoint: None
|
| 104 |
+
[DEBUG generate] shape= (8, 238) last_col_pad_cnt= 0 first_col_pad_cnt= 4
|
| 105 |
+
[DEBUG generate] shape= (8, 249) last_col_pad_cnt= 0 first_col_pad_cnt= 4
|
| 106 |
+
[INFO:swift] best_model_checkpoint: None
|
| 107 |
+
Traceback (most recent call last):
|
| 108 |
+
File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/cli/rlhf.py", line 7, in <module>
|
| 109 |
+
rlhf_main()
|
| 110 |
+
File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/pipelines/train/rlhf.py", line 243, in rlhf_main
|
| 111 |
+
return SwiftRLHF(args).main()
|
| 112 |
+
File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/pipelines/base.py", line 52, in main
|
| 113 |
+
result = self.run()
|
| 114 |
+
File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/ray/base.py", line 168, in wrapper
|
| 115 |
+
return func(self, *args, **kwargs)
|
| 116 |
+
File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/pipelines/train/sft.py", line 197, in run
|
| 117 |
+
return self.train(trainer)
|
| 118 |
+
File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/pipelines/train/sft.py", line 270, in train
|
| 119 |
+
trainer.train(resume_checkpoint)
|
| 120 |
+
File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/trainers/mixin.py", line 895, in train
|
| 121 |
+
res = super().train(*args, **kwargs)
|
| 122 |
+
File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/trainer.py", line 2325, in train
|
| 123 |
+
return inner_training_loop(
|
| 124 |
+
File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/trainer.py", line 2756, in _inner_training_loop
|
| 125 |
+
self._maybe_log_save_evaluate(
|
| 126 |
+
File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/trainers/mixin.py", line 972, in _maybe_log_save_evaluate
|
| 127 |
+
super()._maybe_log_save_evaluate(tr_loss, *args, **kwargs)
|
| 128 |
+
File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/trainer.py", line 3221, in _maybe_log_save_evaluate
|
| 129 |
+
metrics = self._evaluate(trial, ignore_keys_for_eval)
|
| 130 |
+
File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/trainer.py", line 3170, in _evaluate
|
| 131 |
+
metrics = self.evaluate(ignore_keys=ignore_keys_for_eval)
|
| 132 |
+
File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/trainer.py", line 4489, in evaluate
|
| 133 |
+
output = eval_loop(
|
| 134 |
+
File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/rlhf_trainers/grpo_trainer.py", line 1872, in evaluation_loop
|
| 135 |
+
output = super().evaluation_loop(dataloader, *args, **kwargs)
|
| 136 |
+
File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/trainer.py", line 4685, in evaluation_loop
|
| 137 |
+
losses, logits, labels = self.prediction_step(model, inputs, prediction_loss_only, ignore_keys=ignore_keys)
|
| 138 |
+
File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/trl/trainer/grpo_trainer.py", line 2293, in prediction_step
|
| 139 |
+
inputs = self._prepare_inputs(inputs)
|
| 140 |
+
File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/rlhf_trainers/utils.py", line 607, in wrapper
|
| 141 |
+
return func(self, *args, **kwargs)
|
| 142 |
+
File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/rlhf_trainers/grpo_trainer.py", line 208, in _prepare_inputs
|
| 143 |
+
inputs = self._generate_and_score_completions(generation_batch)
|
| 144 |
+
File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/rlhf_trainers/utils.py", line 607, in wrapper
|
| 145 |
+
return func(self, *args, **kwargs)
|
| 146 |
+
File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/rlhf_trainers/grpo_trainer.py", line 236, in _generate_and_score_completions
|
| 147 |
+
inputs = self._generate_completions(inputs)
|
| 148 |
+
File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/rlhf_trainers/grpo_trainer.py", line 222, in _generate_completions
|
| 149 |
+
results = self._infer_single_or_multi_turn(inputs, self.request_config)
|
| 150 |
+
File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/rlhf_trainers/rollout_mixin.py", line 733, in _infer_single_or_multi_turn
|
| 151 |
+
rollout_outputs: List[RolloutOutput] = self._rollout(inputs, request_config, is_global_inputs)
|
| 152 |
+
File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/rlhf_trainers/rollout_mixin.py", line 697, in _rollout
|
| 153 |
+
rollout_outputs = self._colocate_rollout(inputs, request_config)
|
| 154 |
+
File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/rlhf_trainers/rollout_mixin.py", line 1056, in _colocate_rollout
|
| 155 |
+
outputs: List[RolloutOutput] = self._engine_infer(infer_requests=inputs, request_config=request_config)
|
| 156 |
+
File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/rlhf_trainers/rollout_mixin.py", line 1077, in _engine_infer
|
| 157 |
+
res = self.engine.infer(infer_requests, request_config, use_tqdm=use_tqdm)
|
| 158 |
+
File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/infer_engine/transformers_engine.py", line 577, in infer
|
| 159 |
+
res += self._infer(infer_requests_samples, request_config, adapter_request=adapter_request)
|
| 160 |
+
File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/torch/utils/_contextlib.py", line 116, in decorate_context
|
| 161 |
+
return func(*args, **kwargs)
|
| 162 |
+
File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/infer_engine/transformers_engine.py", line 546, in _infer
|
| 163 |
+
res = infer_func(**kwargs)
|
| 164 |
+
File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/infer_engine/transformers_engine.py", line 397, in _infer_full
|
| 165 |
+
output = dict(self.template.generate(self.model, **generate_kwargs))
|
| 166 |
+
File "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/my_qwen3_asr_dapo_register.py", line 670, in generate
|
| 167 |
+
return super().generate(model, *args, **kwargs)
|
| 168 |
+
File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/template/base.py", line 666, in generate
|
| 169 |
+
return model.generate(*args, **kwargs)
|
| 170 |
+
File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/peft/peft_model.py", line 2048, in generate
|
| 171 |
+
outputs = self.base_model.generate(*args, **kwargs)
|
| 172 |
+
File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/torch/utils/_contextlib.py", line 116, in decorate_context
|
| 173 |
+
return func(*args, **kwargs)
|
| 174 |
+
File "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/Qwen3-ASR/qwen_asr/core/transformers_backend/modeling_qwen3_asr.py", line 1353, in generate
|
| 175 |
+
thinker_result = self.thinker.generate(input_ids=input_ids, return_dict_in_generate=True, **thinker_kwargs)
|
| 176 |
+
File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/torch/utils/_contextlib.py", line 116, in decorate_context
|
| 177 |
+
return func(*args, **kwargs)
|
| 178 |
+
File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/generation/utils.py", line 2566, in generate
|
| 179 |
+
result = decoding_method(
|
| 180 |
+
File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/generation/utils.py", line 2789, in _sample
|
| 181 |
+
outputs = model_forward(**model_inputs, return_dict=True)
|
| 182 |
+
File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1739, in _wrapped_call_impl
|
| 183 |
+
return self._call_impl(*args, **kwargs)
|
| 184 |
+
File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1750, in _call_impl
|
| 185 |
+
return forward_call(*args, **kwargs)
|
| 186 |
+
File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/utils/generic.py", line 918, in wrapper
|
| 187 |
+
output = func(self, *args, **kwargs)
|
| 188 |
+
File "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/Qwen3-ASR/qwen_asr/core/transformers_backend/modeling_qwen3_asr.py", line 1230, in forward
|
| 189 |
+
outputs = self.model(
|
| 190 |
+
File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1739, in _wrapped_call_impl
|
| 191 |
+
return self._call_impl(*args, **kwargs)
|
| 192 |
+
File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1750, in _call_impl
|
| 193 |
+
return forward_call(*args, **kwargs)
|
| 194 |
+
File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/utils/generic.py", line 1072, in wrapper
|
| 195 |
+
outputs = func(self, *args, **kwargs)
|
| 196 |
+
File "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/Qwen3-ASR/qwen_asr/core/transformers_backend/modeling_qwen3_asr.py", line 1043, in forward
|
| 197 |
+
layer_outputs = decoder_layer(
|
| 198 |
+
File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/modeling_layers.py", line 94, in __call__
|
| 199 |
+
return super().__call__(*args, **kwargs)
|
| 200 |
+
File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1739, in _wrapped_call_impl
|
| 201 |
+
return self._call_impl(*args, **kwargs)
|
| 202 |
+
File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1750, in _call_impl
|
| 203 |
+
return forward_call(*args, **kwargs)
|
| 204 |
+
File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/utils/deprecation.py", line 172, in wrapped_func
|
| 205 |
+
return func(*args, **kwargs)
|
| 206 |
+
File "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/Qwen3-ASR/qwen_asr/core/transformers_backend/modeling_qwen3_asr.py", line 262, in forward
|
| 207 |
+
hidden_states, _ = self.self_attn(
|
| 208 |
+
File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1739, in _wrapped_call_impl
|
| 209 |
+
return self._call_impl(*args, **kwargs)
|
| 210 |
+
File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1750, in _call_impl
|
| 211 |
+
return forward_call(*args, **kwargs)
|
| 212 |
+
File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/utils/deprecation.py", line 172, in wrapped_func
|
| 213 |
+
return func(*args, **kwargs)
|
| 214 |
+
File "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/Qwen3-ASR/qwen_asr/core/transformers_backend/modeling_qwen3_asr.py", line 188, in forward
|
| 215 |
+
query_states = self.q_norm(self.q_proj(hidden_states).view(hidden_shape)).transpose(1, 2)
|
| 216 |
+
KeyboardInterrupt
|
| 217 |
+
[rank0]: Traceback (most recent call last):
|
| 218 |
+
[rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/cli/rlhf.py", line 7, in <module>
|
| 219 |
+
[rank0]: rlhf_main()
|
| 220 |
+
[rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/pipelines/train/rlhf.py", line 243, in rlhf_main
|
| 221 |
+
[rank0]: return SwiftRLHF(args).main()
|
| 222 |
+
[rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/pipelines/base.py", line 52, in main
|
| 223 |
+
[rank0]: result = self.run()
|
| 224 |
+
[rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/ray/base.py", line 168, in wrapper
|
| 225 |
+
[rank0]: return func(self, *args, **kwargs)
|
| 226 |
+
[rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/pipelines/train/sft.py", line 197, in run
|
| 227 |
+
[rank0]: return self.train(trainer)
|
| 228 |
+
[rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/pipelines/train/sft.py", line 270, in train
|
| 229 |
+
[rank0]: trainer.train(resume_checkpoint)
|
| 230 |
+
[rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/trainers/mixin.py", line 895, in train
|
| 231 |
+
[rank0]: res = super().train(*args, **kwargs)
|
| 232 |
+
[rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/trainer.py", line 2325, in train
|
| 233 |
+
[rank0]: return inner_training_loop(
|
| 234 |
+
[rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/trainer.py", line 2756, in _inner_training_loop
|
| 235 |
+
[rank0]: self._maybe_log_save_evaluate(
|
| 236 |
+
[rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/trainers/mixin.py", line 972, in _maybe_log_save_evaluate
|
| 237 |
+
[rank0]: super()._maybe_log_save_evaluate(tr_loss, *args, **kwargs)
|
| 238 |
+
[rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/trainer.py", line 3221, in _maybe_log_save_evaluate
|
| 239 |
+
[rank0]: metrics = self._evaluate(trial, ignore_keys_for_eval)
|
| 240 |
+
[rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/trainer.py", line 3170, in _evaluate
|
| 241 |
+
[rank0]: metrics = self.evaluate(ignore_keys=ignore_keys_for_eval)
|
| 242 |
+
[rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/trainer.py", line 4489, in evaluate
|
| 243 |
+
[rank0]: output = eval_loop(
|
| 244 |
+
[rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/rlhf_trainers/grpo_trainer.py", line 1872, in evaluation_loop
|
| 245 |
+
[rank0]: output = super().evaluation_loop(dataloader, *args, **kwargs)
|
| 246 |
+
[rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/trainer.py", line 4685, in evaluation_loop
|
| 247 |
+
[rank0]: losses, logits, labels = self.prediction_step(model, inputs, prediction_loss_only, ignore_keys=ignore_keys)
|
| 248 |
+
[rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/trl/trainer/grpo_trainer.py", line 2293, in prediction_step
|
| 249 |
+
[rank0]: inputs = self._prepare_inputs(inputs)
|
| 250 |
+
[rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/rlhf_trainers/utils.py", line 607, in wrapper
|
| 251 |
+
[rank0]: return func(self, *args, **kwargs)
|
| 252 |
+
[rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/rlhf_trainers/grpo_trainer.py", line 208, in _prepare_inputs
|
| 253 |
+
[rank0]: inputs = self._generate_and_score_completions(generation_batch)
|
| 254 |
+
[rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/rlhf_trainers/utils.py", line 607, in wrapper
|
| 255 |
+
[rank0]: return func(self, *args, **kwargs)
|
| 256 |
+
[rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/rlhf_trainers/grpo_trainer.py", line 236, in _generate_and_score_completions
|
| 257 |
+
[rank0]: inputs = self._generate_completions(inputs)
|
| 258 |
+
[rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/rlhf_trainers/grpo_trainer.py", line 222, in _generate_completions
|
| 259 |
+
[rank0]: results = self._infer_single_or_multi_turn(inputs, self.request_config)
|
| 260 |
+
[rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/rlhf_trainers/rollout_mixin.py", line 733, in _infer_single_or_multi_turn
|
| 261 |
+
[rank0]: rollout_outputs: List[RolloutOutput] = self._rollout(inputs, request_config, is_global_inputs)
|
| 262 |
+
[rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/rlhf_trainers/rollout_mixin.py", line 697, in _rollout
|
| 263 |
+
[rank0]: rollout_outputs = self._colocate_rollout(inputs, request_config)
|
| 264 |
+
[rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/rlhf_trainers/rollout_mixin.py", line 1056, in _colocate_rollout
|
| 265 |
+
[rank0]: outputs: List[RolloutOutput] = self._engine_infer(infer_requests=inputs, request_config=request_config)
|
| 266 |
+
[rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/rlhf_trainers/rollout_mixin.py", line 1077, in _engine_infer
|
| 267 |
+
[rank0]: res = self.engine.infer(infer_requests, request_config, use_tqdm=use_tqdm)
|
| 268 |
+
[rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/infer_engine/transformers_engine.py", line 577, in infer
|
| 269 |
+
[rank0]: res += self._infer(infer_requests_samples, request_config, adapter_request=adapter_request)
|
| 270 |
+
[rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/torch/utils/_contextlib.py", line 116, in decorate_context
|
| 271 |
+
[rank0]: return func(*args, **kwargs)
|
| 272 |
+
[rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/infer_engine/transformers_engine.py", line 546, in _infer
|
| 273 |
+
[rank0]: res = infer_func(**kwargs)
|
| 274 |
+
[rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/infer_engine/transformers_engine.py", line 397, in _infer_full
|
| 275 |
+
[rank0]: output = dict(self.template.generate(self.model, **generate_kwargs))
|
| 276 |
+
[rank0]: File "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/my_qwen3_asr_dapo_register.py", line 670, in generate
|
| 277 |
+
[rank0]: return super().generate(model, *args, **kwargs)
|
| 278 |
+
[rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/template/base.py", line 666, in generate
|
| 279 |
+
[rank0]: return model.generate(*args, **kwargs)
|
| 280 |
+
[rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/peft/peft_model.py", line 2048, in generate
|
| 281 |
+
[rank0]: outputs = self.base_model.generate(*args, **kwargs)
|
| 282 |
+
[rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/torch/utils/_contextlib.py", line 116, in decorate_context
|
| 283 |
+
[rank0]: return func(*args, **kwargs)
|
| 284 |
+
[rank0]: File "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/Qwen3-ASR/qwen_asr/core/transformers_backend/modeling_qwen3_asr.py", line 1353, in generate
|
| 285 |
+
[rank0]: thinker_result = self.thinker.generate(input_ids=input_ids, return_dict_in_generate=True, **thinker_kwargs)
|
| 286 |
+
[rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/torch/utils/_contextlib.py", line 116, in decorate_context
|
| 287 |
+
[rank0]: return func(*args, **kwargs)
|
| 288 |
+
[rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/generation/utils.py", line 2566, in generate
|
| 289 |
+
[rank0]: result = decoding_method(
|
| 290 |
+
[rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/generation/utils.py", line 2789, in _sample
|
| 291 |
+
[rank0]: outputs = model_forward(**model_inputs, return_dict=True)
|
| 292 |
+
[rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1739, in _wrapped_call_impl
|
| 293 |
+
[rank0]: return self._call_impl(*args, **kwargs)
|
| 294 |
+
[rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1750, in _call_impl
|
| 295 |
+
[rank0]: return forward_call(*args, **kwargs)
|
| 296 |
+
[rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/utils/generic.py", line 918, in wrapper
|
| 297 |
+
[rank0]: output = func(self, *args, **kwargs)
|
| 298 |
+
[rank0]: File "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/Qwen3-ASR/qwen_asr/core/transformers_backend/modeling_qwen3_asr.py", line 1230, in forward
|
| 299 |
+
[rank0]: outputs = self.model(
|
| 300 |
+
[rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1739, in _wrapped_call_impl
|
| 301 |
+
[rank0]: return self._call_impl(*args, **kwargs)
|
| 302 |
+
[rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1750, in _call_impl
|
| 303 |
+
[rank0]: return forward_call(*args, **kwargs)
|
| 304 |
+
[rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/utils/generic.py", line 1072, in wrapper
|
| 305 |
+
[rank0]: outputs = func(self, *args, **kwargs)
|
| 306 |
+
[rank0]: File "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/Qwen3-ASR/qwen_asr/core/transformers_backend/modeling_qwen3_asr.py", line 1043, in forward
|
| 307 |
+
[rank0]: layer_outputs = decoder_layer(
|
| 308 |
+
[rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/modeling_layers.py", line 94, in __call__
|
| 309 |
+
[rank0]: return super().__call__(*args, **kwargs)
|
| 310 |
+
[rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1739, in _wrapped_call_impl
|
| 311 |
+
[rank0]: return self._call_impl(*args, **kwargs)
|
| 312 |
+
[rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1750, in _call_impl
|
| 313 |
+
[rank0]: return forward_call(*args, **kwargs)
|
| 314 |
+
[rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/utils/deprecation.py", line 172, in wrapped_func
|
| 315 |
+
[rank0]: return func(*args, **kwargs)
|
| 316 |
+
[rank0]: File "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/Qwen3-ASR/qwen_asr/core/transformers_backend/modeling_qwen3_asr.py", line 262, in forward
|
| 317 |
+
[rank0]: hidden_states, _ = self.self_attn(
|
| 318 |
+
[rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1739, in _wrapped_call_impl
|
| 319 |
+
[rank0]: return self._call_impl(*args, **kwargs)
|
| 320 |
+
[rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1750, in _call_impl
|
| 321 |
+
[rank0]: return forward_call(*args, **kwargs)
|
| 322 |
+
[rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/utils/deprecation.py", line 172, in wrapped_func
|
| 323 |
+
[rank0]: return func(*args, **kwargs)
|
| 324 |
+
[rank0]: File "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/Qwen3-ASR/qwen_asr/core/transformers_backend/modeling_qwen3_asr.py", line 188, in forward
|
| 325 |
+
[rank0]: query_states = self.q_norm(self.q_proj(hidden_states).view(hidden_shape)).transpose(1, 2)
|
| 326 |
+
[rank0]: KeyboardInterrupt
|
wandb/run-20260417_123237-3h84yfea/files/requirements.txt
ADDED
|
@@ -0,0 +1,255 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
psutil==7.2.2
|
| 2 |
+
colorama==0.4.6
|
| 3 |
+
typing-inspection==0.4.2
|
| 4 |
+
dill==0.3.8
|
| 5 |
+
aliyun-python-sdk-kms==2.16.5
|
| 6 |
+
urllib3==2.6.3
|
| 7 |
+
torch==2.6.0
|
| 8 |
+
threadpoolctl==3.6.0
|
| 9 |
+
pyzmq==27.1.0
|
| 10 |
+
astor==0.8.1
|
| 11 |
+
hf-xet==1.4.3
|
| 12 |
+
sniffio==1.3.1
|
| 13 |
+
tensorboard==2.20.0
|
| 14 |
+
fastar==0.11.0
|
| 15 |
+
llvmlite==0.43.0
|
| 16 |
+
pathspec==1.0.4
|
| 17 |
+
mkl_fft==1.3.11
|
| 18 |
+
prometheus_client==0.25.0
|
| 19 |
+
async-timeout==5.0.1
|
| 20 |
+
scikit-learn==1.7.2
|
| 21 |
+
sortedcontainers==2.4.0
|
| 22 |
+
Bottleneck==1.4.2
|
| 23 |
+
orjson==3.11.8
|
| 24 |
+
nest-asyncio==1.6.0
|
| 25 |
+
cupy-cuda12x==13.6.0
|
| 26 |
+
semantic-version==2.10.0
|
| 27 |
+
aiosignal==1.4.0
|
| 28 |
+
fsspec==2025.3.0
|
| 29 |
+
dyNET38==2.2
|
| 30 |
+
shellingham==1.5.4
|
| 31 |
+
zstandard==0.25.0
|
| 32 |
+
PyYAML==6.0.3
|
| 33 |
+
nvidia-curand-cu12==10.3.5.147
|
| 34 |
+
gradio==5.50.0
|
| 35 |
+
Werkzeug==3.1.8
|
| 36 |
+
grpcio==1.80.0
|
| 37 |
+
aiohttp==3.13.5
|
| 38 |
+
Flask==3.1.3
|
| 39 |
+
python-json-logger==4.1.0
|
| 40 |
+
trl==0.29.1
|
| 41 |
+
nltk==3.9.4
|
| 42 |
+
platformdirs==4.9.6
|
| 43 |
+
lm-format-enforcer==0.10.12
|
| 44 |
+
pyparsing==3.3.2
|
| 45 |
+
jmespath==0.10.0
|
| 46 |
+
starlette==0.52.1
|
| 47 |
+
crcmod==1.7
|
| 48 |
+
dnspython==2.8.0
|
| 49 |
+
antlr4-python3-runtime==4.9.3
|
| 50 |
+
rouge==1.0.1
|
| 51 |
+
importlib_metadata==9.0.0
|
| 52 |
+
nvidia-cudnn-cu12==9.1.0.70
|
| 53 |
+
safetensors==0.7.0
|
| 54 |
+
blake3==1.0.8
|
| 55 |
+
interegular==0.3.3
|
| 56 |
+
tiktoken==0.11.0
|
| 57 |
+
pydantic_core==2.41.4
|
| 58 |
+
outlines==0.1.11
|
| 59 |
+
airportsdata==20260315
|
| 60 |
+
rich-toolkit==0.19.7
|
| 61 |
+
multiprocess==0.70.16
|
| 62 |
+
sympy==1.13.1
|
| 63 |
+
psutil==7.2.2
|
| 64 |
+
h11==0.16.0
|
| 65 |
+
anyio==4.13.0
|
| 66 |
+
Cython==3.2.4
|
| 67 |
+
outlines_core==0.1.26
|
| 68 |
+
jsonschema==4.26.0
|
| 69 |
+
nvidia-cuda-cupti-cu12==12.4.127
|
| 70 |
+
meson-python==0.19.0
|
| 71 |
+
depyf==0.18.0
|
| 72 |
+
audioread==3.1.0
|
| 73 |
+
typer==0.24.1
|
| 74 |
+
nvidia-cuda-nvrtc-cu12==12.4.127
|
| 75 |
+
joblib==1.5.3
|
| 76 |
+
torchvision==0.21.0
|
| 77 |
+
hf-gradio==0.3.2
|
| 78 |
+
huggingface_hub==0.36.2
|
| 79 |
+
websockets==15.0.1
|
| 80 |
+
diskcache==5.6.3
|
| 81 |
+
mistral_common==1.11.0
|
| 82 |
+
partial-json-parser==0.2.1.1.post7
|
| 83 |
+
simplejson==3.20.2
|
| 84 |
+
watchfiles==1.1.1
|
| 85 |
+
Jinja2==3.1.6
|
| 86 |
+
GitPython==3.1.46
|
| 87 |
+
numexpr==2.11.0
|
| 88 |
+
pydub==0.25.1
|
| 89 |
+
brotli==1.2.0
|
| 90 |
+
binpacking==2.0.1
|
| 91 |
+
cmake==4.3.1
|
| 92 |
+
pydantic==2.12.3
|
| 93 |
+
mkl-service==2.4.0
|
| 94 |
+
protobuf==6.33.6
|
| 95 |
+
gguf==0.10.0
|
| 96 |
+
MarkupSafe==3.0.3
|
| 97 |
+
exceptiongroup==1.3.1
|
| 98 |
+
markdown-it-py==4.0.0
|
| 99 |
+
soxr==1.0.0
|
| 100 |
+
pyarrow==20.0.0
|
| 101 |
+
tqdm==4.67.3
|
| 102 |
+
meson==1.11.0
|
| 103 |
+
fonttools==4.62.1
|
| 104 |
+
annotated-types==0.7.0
|
| 105 |
+
networkx==3.4.2
|
| 106 |
+
nvidia-cuda-runtime-cu12==12.4.127
|
| 107 |
+
compressed-tensors==0.9.2
|
| 108 |
+
wandb==0.23.0
|
| 109 |
+
mdurl==0.1.2
|
| 110 |
+
charset-normalizer==3.4.7
|
| 111 |
+
Pygments==2.20.0
|
| 112 |
+
zipp==3.23.1
|
| 113 |
+
prometheus-fastapi-instrumentator==7.1.0
|
| 114 |
+
aiofiles==24.1.0
|
| 115 |
+
lark==1.2.2
|
| 116 |
+
addict==2.4.0
|
| 117 |
+
pydantic-settings==2.13.1
|
| 118 |
+
opencv-python-headless==4.11.0.86
|
| 119 |
+
certifi==2026.2.25
|
| 120 |
+
sox==1.5.0
|
| 121 |
+
nagisa==0.2.11
|
| 122 |
+
six==1.17.0
|
| 123 |
+
tokenizers==0.22.2
|
| 124 |
+
mkl_random==1.2.8
|
| 125 |
+
fastapi-cloud-cli==0.17.0
|
| 126 |
+
propcache==0.4.1
|
| 127 |
+
cachetools==7.0.5
|
| 128 |
+
rpds-py==0.30.0
|
| 129 |
+
torchaudio==2.6.0
|
| 130 |
+
setuptools==82.0.1
|
| 131 |
+
py-cpuinfo==9.0.0
|
| 132 |
+
tomli==2.4.1
|
| 133 |
+
xxhash==3.6.0
|
| 134 |
+
pip==26.0.1
|
| 135 |
+
contourpy==1.3.2
|
| 136 |
+
absl-py==2.4.0
|
| 137 |
+
mpmath==1.3.0
|
| 138 |
+
ms_swift==4.0.3
|
| 139 |
+
pyproject-metadata==0.11.0
|
| 140 |
+
aiohappyeyeballs==2.6.1
|
| 141 |
+
httpx==0.28.1
|
| 142 |
+
json_repair==0.59.4
|
| 143 |
+
blinker==1.9.0
|
| 144 |
+
tzdata==2025.3
|
| 145 |
+
tensorboard-data-server==0.7.2
|
| 146 |
+
pydantic-extra-types==2.11.1
|
| 147 |
+
Markdown==3.10.2
|
| 148 |
+
nvidia-cusparselt-cu12==0.6.2
|
| 149 |
+
rignore==0.7.6
|
| 150 |
+
openai==2.32.0
|
| 151 |
+
soundfile==0.13.1
|
| 152 |
+
lazy-loader==0.5
|
| 153 |
+
av==14.2.0
|
| 154 |
+
yarl==1.23.0
|
| 155 |
+
python-dateutil==2.9.0.post0
|
| 156 |
+
groovy==0.1.2
|
| 157 |
+
xformers==0.0.29.post2
|
| 158 |
+
qwen-omni-utils==0.0.9
|
| 159 |
+
rich==15.0.0
|
| 160 |
+
xgrammar==0.1.16
|
| 161 |
+
numba==0.60.0
|
| 162 |
+
nvidia-cusolver-cu12==11.6.1.9
|
| 163 |
+
scikit_build_core==0.12.2
|
| 164 |
+
ffmpy==1.0.0
|
| 165 |
+
wheel==0.46.3
|
| 166 |
+
jiter==0.14.0
|
| 167 |
+
oss2==2.19.1
|
| 168 |
+
transformers==4.57.6
|
| 169 |
+
fastrlock==0.8.3
|
| 170 |
+
click==8.3.2
|
| 171 |
+
pooch==1.9.0
|
| 172 |
+
distro==1.9.0
|
| 173 |
+
nvidia-cublas-cu12==12.4.5.8
|
| 174 |
+
regex==2026.4.4
|
| 175 |
+
cpm-kernels==1.0.11
|
| 176 |
+
safehttpx==0.1.7
|
| 177 |
+
matplotlib==3.10.8
|
| 178 |
+
httptools==0.7.1
|
| 179 |
+
nvidia-cusparse-cu12==12.3.1.170
|
| 180 |
+
qwen-asr==0.0.6
|
| 181 |
+
gradio_client==1.14.0
|
| 182 |
+
gitdb==4.0.12
|
| 183 |
+
fastapi-cli==0.0.24
|
| 184 |
+
soynlp==0.0.493
|
| 185 |
+
python-dotenv==1.2.2
|
| 186 |
+
nvidia-cufft-cu12==11.2.1.3
|
| 187 |
+
accelerate==1.12.0
|
| 188 |
+
tomlkit==0.13.3
|
| 189 |
+
triton==3.2.0
|
| 190 |
+
filelock==3.28.0
|
| 191 |
+
pycountry==26.2.16
|
| 192 |
+
modelscope==1.35.4
|
| 193 |
+
annotated-doc==0.0.4
|
| 194 |
+
referencing==0.37.0
|
| 195 |
+
numpy==1.26.4
|
| 196 |
+
aliyun-python-sdk-core==2.16.0
|
| 197 |
+
attrs==26.1.0
|
| 198 |
+
vllm==0.8.0
|
| 199 |
+
python-multipart==0.0.26
|
| 200 |
+
jsonschema-specifications==2025.9.1
|
| 201 |
+
idna==3.11
|
| 202 |
+
scipy==1.15.3
|
| 203 |
+
typing_extensions==4.15.0
|
| 204 |
+
itsdangerous==2.2.0
|
| 205 |
+
msgspec==0.21.1
|
| 206 |
+
msgpack==1.1.2
|
| 207 |
+
nvidia-nvjitlink-cu12==12.4.127
|
| 208 |
+
pycryptodome==3.23.0
|
| 209 |
+
ninja==1.13.0
|
| 210 |
+
pillow==11.3.0
|
| 211 |
+
email-validator==2.3.0
|
| 212 |
+
cryptography==46.0.7
|
| 213 |
+
peft==0.18.1
|
| 214 |
+
kiwisolver==1.5.0
|
| 215 |
+
cffi==2.0.0
|
| 216 |
+
einops==0.8.2
|
| 217 |
+
pytz==2026.1.post1
|
| 218 |
+
uvloop==0.22.1
|
| 219 |
+
requests==2.33.1
|
| 220 |
+
sentencepiece==0.2.1
|
| 221 |
+
attrdict==2.0.1
|
| 222 |
+
dacite==1.9.2
|
| 223 |
+
cloudpickle==3.1.2
|
| 224 |
+
ray==2.55.0
|
| 225 |
+
fastapi==0.135.3
|
| 226 |
+
librosa==0.11.0
|
| 227 |
+
ruff==0.15.10
|
| 228 |
+
multidict==6.7.1
|
| 229 |
+
smmap==5.0.3
|
| 230 |
+
packaging==26.0
|
| 231 |
+
pycparser==3.0
|
| 232 |
+
decorator==5.2.1
|
| 233 |
+
transformers-stream-generator==0.0.5
|
| 234 |
+
nvidia-nccl-cu12==2.21.5
|
| 235 |
+
frozenlist==1.8.0
|
| 236 |
+
uvicorn==0.44.0
|
| 237 |
+
datasets==3.6.0
|
| 238 |
+
cycler==0.12.1
|
| 239 |
+
omegaconf==2.3.0
|
| 240 |
+
httpcore==1.0.9
|
| 241 |
+
pandas==2.3.2
|
| 242 |
+
nvidia-nvtx-cu12==12.4.127
|
| 243 |
+
sentry-sdk==2.58.0
|
| 244 |
+
wheel==0.46.3
|
| 245 |
+
autocommand==2.2.2
|
| 246 |
+
tomli==2.4.0
|
| 247 |
+
packaging==26.0
|
| 248 |
+
more-itertools==10.8.0
|
| 249 |
+
zipp==3.23.0
|
| 250 |
+
platformdirs==4.4.0
|
| 251 |
+
jaraco.context==6.1.0
|
| 252 |
+
jaraco.text==4.0.0
|
| 253 |
+
backports.tarfile==1.2.0
|
| 254 |
+
jaraco.functools==4.4.0
|
| 255 |
+
importlib_metadata==8.7.1
|
wandb/run-20260417_123237-3h84yfea/files/wandb-metadata.json
ADDED
|
@@ -0,0 +1,223 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"os": "Linux-3.10.0-957.el7.x86_64-x86_64-with-glibc2.17",
|
| 3 |
+
"python": "CPython 3.10.18",
|
| 4 |
+
"startedAt": "2026-04-17T04:32:37.414555Z",
|
| 5 |
+
"args": [
|
| 6 |
+
"--rlhf_type",
|
| 7 |
+
"grpo",
|
| 8 |
+
"--external_plugins",
|
| 9 |
+
"/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/my_qwen3_asr_dapo_register.py",
|
| 10 |
+
"/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/0417_reward.py",
|
| 11 |
+
"--model",
|
| 12 |
+
"/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/qwen3-asr-merged",
|
| 13 |
+
"--model_type",
|
| 14 |
+
"my_qwen3_asr_rl",
|
| 15 |
+
"--template",
|
| 16 |
+
"my_qwen3_asr_rl",
|
| 17 |
+
"--dataset",
|
| 18 |
+
"/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/lora_0323_10w+55w+error+syn_with_domain_train90_targeted_rl_train90_loramerged_basewer_3suppress_server.jsonl",
|
| 19 |
+
"--val_dataset",
|
| 20 |
+
"/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/lora_0323_10w+55w+error+syn_with_domain_train90_targeted_rl_val5_sample5p_server.jsonl",
|
| 21 |
+
"--reward_funcs",
|
| 22 |
+
"asr_wer_sub_len_cmp_hallu_dirty_v56",
|
| 23 |
+
"--train_type",
|
| 24 |
+
"lora",
|
| 25 |
+
"--use_vllm",
|
| 26 |
+
"false",
|
| 27 |
+
"--log_completions",
|
| 28 |
+
"true",
|
| 29 |
+
"--loss_type",
|
| 30 |
+
"dapo",
|
| 31 |
+
"--advantage_estimator",
|
| 32 |
+
"grpo",
|
| 33 |
+
"--scale_rewards",
|
| 34 |
+
"group",
|
| 35 |
+
"--num_iterations",
|
| 36 |
+
"2",
|
| 37 |
+
"--beta",
|
| 38 |
+
"0.04",
|
| 39 |
+
"--epsilon_high",
|
| 40 |
+
"0.28",
|
| 41 |
+
"--dynamic_sample",
|
| 42 |
+
"true",
|
| 43 |
+
"--max_resample_times",
|
| 44 |
+
"4",
|
| 45 |
+
"--overlong_filter",
|
| 46 |
+
"true",
|
| 47 |
+
"--truncation_strategy",
|
| 48 |
+
"delete",
|
| 49 |
+
"--num_generations",
|
| 50 |
+
"12",
|
| 51 |
+
"--generation_batch_size",
|
| 52 |
+
"48",
|
| 53 |
+
"--per_device_train_batch_size",
|
| 54 |
+
"8",
|
| 55 |
+
"--per_device_eval_batch_size",
|
| 56 |
+
"8",
|
| 57 |
+
"--gradient_accumulation_steps",
|
| 58 |
+
"12",
|
| 59 |
+
"--num_generations_eval",
|
| 60 |
+
"4",
|
| 61 |
+
"--max_completion_length",
|
| 62 |
+
"256",
|
| 63 |
+
"--temperature",
|
| 64 |
+
"0.50",
|
| 65 |
+
"--top_p",
|
| 66 |
+
"0.95",
|
| 67 |
+
"--top_k",
|
| 68 |
+
"50",
|
| 69 |
+
"--repetition_penalty",
|
| 70 |
+
"1.08",
|
| 71 |
+
"--learning_rate",
|
| 72 |
+
"5e-5",
|
| 73 |
+
"--lr_scheduler_type",
|
| 74 |
+
"cosine",
|
| 75 |
+
"--warmup_ratio",
|
| 76 |
+
"0.03",
|
| 77 |
+
"--report_to",
|
| 78 |
+
"wandb",
|
| 79 |
+
"--run_name",
|
| 80 |
+
"qwen3asr_dapo_reward56_4x4x12_12gen_4GPU",
|
| 81 |
+
"--output_dir",
|
| 82 |
+
"/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/out/qwen3asr_dapo_reward56_4x4x12_12gen_4GPU",
|
| 83 |
+
"--save_strategy",
|
| 84 |
+
"steps",
|
| 85 |
+
"--save_steps",
|
| 86 |
+
"20",
|
| 87 |
+
"--logging_steps",
|
| 88 |
+
"5",
|
| 89 |
+
"--freeze_llm",
|
| 90 |
+
"false",
|
| 91 |
+
"--freeze_vit",
|
| 92 |
+
"false",
|
| 93 |
+
"--freeze_aligner",
|
| 94 |
+
"false",
|
| 95 |
+
"--remove_unused_columns",
|
| 96 |
+
"false",
|
| 97 |
+
"--padding_side",
|
| 98 |
+
"left"
|
| 99 |
+
],
|
| 100 |
+
"program": "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/cli/rlhf.py",
|
| 101 |
+
"email": "pang_kaiyu@163.com",
|
| 102 |
+
"root": "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload",
|
| 103 |
+
"host": "SH-IDC1-10-140-37-1",
|
| 104 |
+
"executable": "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/bin/python3.10",
|
| 105 |
+
"cpu_count": 64,
|
| 106 |
+
"cpu_count_logical": 128,
|
| 107 |
+
"gpu": "NVIDIA A100-SXM4-80GB",
|
| 108 |
+
"gpu_count": 8,
|
| 109 |
+
"disk": {
|
| 110 |
+
"/": {
|
| 111 |
+
"total": "524945911808",
|
| 112 |
+
"used": "105544630272"
|
| 113 |
+
}
|
| 114 |
+
},
|
| 115 |
+
"memory": {
|
| 116 |
+
"total": "1081627828224"
|
| 117 |
+
},
|
| 118 |
+
"gpu_nvidia": [
|
| 119 |
+
{
|
| 120 |
+
"name": "NVIDIA A100-SXM4-80GB",
|
| 121 |
+
"memoryTotal": "85899345920",
|
| 122 |
+
"cudaCores": 6912,
|
| 123 |
+
"architecture": "Ampere",
|
| 124 |
+
"uuid": "GPU-51466de9-a668-3c7e-bb90-bb8c112e0fea"
|
| 125 |
+
},
|
| 126 |
+
{
|
| 127 |
+
"name": "NVIDIA A100-SXM4-80GB",
|
| 128 |
+
"memoryTotal": "85899345920",
|
| 129 |
+
"cudaCores": 6912,
|
| 130 |
+
"architecture": "Ampere",
|
| 131 |
+
"uuid": "GPU-ec1a5f87-66dd-26c2-5656-b57c7015a595"
|
| 132 |
+
},
|
| 133 |
+
{
|
| 134 |
+
"name": "NVIDIA A100-SXM4-80GB",
|
| 135 |
+
"memoryTotal": "85899345920",
|
| 136 |
+
"cudaCores": 6912,
|
| 137 |
+
"architecture": "Ampere",
|
| 138 |
+
"uuid": "GPU-2dabb104-8ec6-09ec-017a-204779e18c19"
|
| 139 |
+
},
|
| 140 |
+
{
|
| 141 |
+
"name": "NVIDIA A100-SXM4-80GB",
|
| 142 |
+
"memoryTotal": "85899345920",
|
| 143 |
+
"cudaCores": 6912,
|
| 144 |
+
"architecture": "Ampere",
|
| 145 |
+
"uuid": "GPU-0e67540a-1930-f39b-320f-0a6bfe1da2e0"
|
| 146 |
+
},
|
| 147 |
+
{
|
| 148 |
+
"name": "NVIDIA A100-SXM4-80GB",
|
| 149 |
+
"memoryTotal": "85899345920",
|
| 150 |
+
"cudaCores": 6912,
|
| 151 |
+
"architecture": "Ampere",
|
| 152 |
+
"uuid": "GPU-b46e583c-5ac8-e350-6045-49ad7b17c092"
|
| 153 |
+
},
|
| 154 |
+
{
|
| 155 |
+
"name": "NVIDIA A100-SXM4-80GB",
|
| 156 |
+
"memoryTotal": "85899345920",
|
| 157 |
+
"cudaCores": 6912,
|
| 158 |
+
"architecture": "Ampere",
|
| 159 |
+
"uuid": "GPU-f293d16a-41a0-fbc1-e86c-4f9682cb5e2b"
|
| 160 |
+
},
|
| 161 |
+
{
|
| 162 |
+
"name": "NVIDIA A100-SXM4-80GB",
|
| 163 |
+
"memoryTotal": "85899345920",
|
| 164 |
+
"cudaCores": 6912,
|
| 165 |
+
"architecture": "Ampere",
|
| 166 |
+
"uuid": "GPU-67958330-9199-dca8-5c2e-c665b13b3452"
|
| 167 |
+
},
|
| 168 |
+
{
|
| 169 |
+
"name": "NVIDIA A100-SXM4-80GB",
|
| 170 |
+
"memoryTotal": "85899345920",
|
| 171 |
+
"cudaCores": 6912,
|
| 172 |
+
"architecture": "Ampere",
|
| 173 |
+
"uuid": "GPU-6b56602f-4dcf-cb9d-4e98-04bf6254b789"
|
| 174 |
+
}
|
| 175 |
+
],
|
| 176 |
+
"cudaVersion": "12.4",
|
| 177 |
+
"slurm": {
|
| 178 |
+
"cluster_name": "cluster_sproject3",
|
| 179 |
+
"conf": "/etc/slurm/slurm.conf",
|
| 180 |
+
"cpus_on_node": "2",
|
| 181 |
+
"gtids": "0",
|
| 182 |
+
"job_account": "research",
|
| 183 |
+
"job_cpus_per_node": "2",
|
| 184 |
+
"job_gid": "800000689",
|
| 185 |
+
"job_id": "8568802",
|
| 186 |
+
"job_name": "qwen_debug",
|
| 187 |
+
"job_nodelist": "SH-IDC1-10-140-37-1",
|
| 188 |
+
"job_num_nodes": "1",
|
| 189 |
+
"job_partition": "interntmp",
|
| 190 |
+
"job_qos": "normal",
|
| 191 |
+
"job_uid": "800000689",
|
| 192 |
+
"job_user": "panjiabao",
|
| 193 |
+
"jobid": "8568802",
|
| 194 |
+
"launch_node_ipaddr": "10.140.37.164",
|
| 195 |
+
"localid": "0",
|
| 196 |
+
"nnodes": "1",
|
| 197 |
+
"nodeid": "0",
|
| 198 |
+
"nodelist": "SH-IDC1-10-140-37-1",
|
| 199 |
+
"nprocs": "1",
|
| 200 |
+
"ntasks": "1",
|
| 201 |
+
"prio_process": "0",
|
| 202 |
+
"procid": "0",
|
| 203 |
+
"srun_comm_host": "10.140.37.164",
|
| 204 |
+
"srun_comm_port": "44570",
|
| 205 |
+
"step_gpus": "4,5",
|
| 206 |
+
"step_id": "0",
|
| 207 |
+
"step_launcher_port": "44570",
|
| 208 |
+
"step_nodelist": "SH-IDC1-10-140-37-1",
|
| 209 |
+
"step_num_nodes": "1",
|
| 210 |
+
"step_num_tasks": "1",
|
| 211 |
+
"step_tasks_per_node": "1",
|
| 212 |
+
"stepid": "0",
|
| 213 |
+
"submit_dir": "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload",
|
| 214 |
+
"submit_host": "SH-IDC1-10-140-37-164",
|
| 215 |
+
"task_pid": "24357",
|
| 216 |
+
"tasks_per_node": "1",
|
| 217 |
+
"topology_addr": "SH-IDC1-10-140-37-1",
|
| 218 |
+
"topology_addr_pattern": "node",
|
| 219 |
+
"umask": "0002",
|
| 220 |
+
"working_cluster": "cluster_sproject3:SH-IDC1-10-140-37-161:6817:9216:109"
|
| 221 |
+
},
|
| 222 |
+
"writerId": "bpic2cpmtxvnwca2pu2tg19g1j2qwpb2"
|
| 223 |
+
}
|
wandb/run-20260417_123237-3h84yfea/files/wandb-summary.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"_step":10,"train/clip_ratio/high_max":0.012200319871772081,"_runtime":1109.549686456,"train/rewards/ASRWerSubLenCmpHalluDirtyV56/std":0.4208546429872513,"profiling/Time taken: GRPOTrainer.ASRWerSubLenCmpHalluDirtyV56":0.05729236314073205,"train/learning_rate":3.5714285714285714e-06,"profiling/Time taken: GRPOTrainer._prepare_batch_inputs":0.7034707930870354,"train/reward":0.022321835905313493,"profiling/Time taken: GRPOTrainer.generate":3.802002454176545,"train/epoch":0.0064329366355741395,"train/frac_reward_zero_std":0,"train/clip_ratio/low_mean":0.014095272546789299,"train/clip_ratio/region_mean":0.02252715122886002,"train/completions/max_length":61.4,"train/completions/mean_length":48.42812652587891,"train/completions/min_length":30.25,"train/clip_ratio/low_min":0.008001556829549372,"train/kl":0.00529333179583773,"completions":{"path":"media/table/completions_9_ec21142175e3781c9ddd.table.json","ncols":6,"log_mode":"IMMUTABLE","_type":"table-file","artifact_path":"wandb-client-artifact://kz4vrnypdmle4zgoj3c84weqxmxkvdxftnrs55geadw9knsskgfo49q6n1xtl9bk3gu4h9ojvabrseb66dnps3myxgfrem7lvv7fjv618wfxr5ofpjviqu6xhn9nlkki/completions.table.json","size":30810,"nrows":48,"_latest_artifact_path":"wandb-client-artifact://b69jh609tckqry5pvjdgc75co4t33phnplrzajmhbdyubzbumzvvphifhlwul9nw1lkqc2xwcxwq9l1gnv9ymu6hjz8nv21mkh590wyd7n2m3v6vfjc58y4w8x9kkji0:latest/completions.table.json","sha256":"ec21142175e3781c9ddd0e8bcbb9129cea8a4112a1677ab3a9541e1a4670ca03"},"profiling/Time taken: GRPOTrainer.compute_loss":0.38397085713222623,"train/clip_ratio/high_mean":0.008431878668488935,"train/global_step":20,"train/step_time":25.729406683100386,"profiling/Time taken: GRPOTrainer._score_completions":0.05837428104132414,"profiling/Time taken: GRPOTrainer.log_metrics":0.00924607808701694,"train/loss":0.0031860221177339556,"_wandb":{"runtime":1109},"profiling/Time taken: GRPOTrainer._get_per_token_logps_and_entropies":0.34411595296114683,"profiling/Time taken: 
GRPOTrainer._generate_and_score_completions":4.66908916993998,"_timestamp":1.7764014649839177e+09,"profiling/Time taken: GRPOTrainer._prepare_inputs":4.669255583081394,"train/reward_std":0.1609206058084965,"train/completions/clipped_ratio":0,"profiling/Time taken: GRPOTrainer.resample_encode_failed_inputs":0.07994826301001012,"profiling/Time taken: GRPOTrainer._dynamic_sampling":1.0511806420981884,"train/rewards/ASRWerSubLenCmpHalluDirtyV56/mean":0.02232184025924653,"train/grad_norm":0.908744215965271}
|
wandb/run-20260417_123237-3h84yfea/logs/debug-core.log
ADDED
|
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{"time":"2026-04-17T12:32:37.733571714+08:00","level":"INFO","msg":"main: starting server","port-filename":"/tmp/tmp6lseefed/port-26590.txt","pid":26590,"log-level":0,"disable-analytics":false,"shutdown-on-parent-exit":false,"enable-dcgm-profiling":false}
|
| 2 |
+
{"time":"2026-04-17T12:32:37.736196619+08:00","level":"INFO","msg":"server: will exit if parent process dies","ppid":26590}
|
| 3 |
+
{"time":"2026-04-17T12:32:37.736232389+08:00","level":"INFO","msg":"server: accepting connections","addr":{"Name":"/tmp/wandb-26590-39544-1290766967/socket","Net":"unix"}}
|
| 4 |
+
{"time":"2026-04-17T12:32:37.819031966+08:00","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"1(@)"}
|
| 5 |
+
{"time":"2026-04-17T12:32:37.828108271+08:00","level":"INFO","msg":"handleInformInit: received","streamId":"3h84yfea","id":"1(@)"}
|
| 6 |
+
{"time":"2026-04-17T12:32:38.291204091+08:00","level":"INFO","msg":"handleInformInit: stream started","streamId":"3h84yfea","id":"1(@)"}
|
| 7 |
+
{"time":"2026-04-17T12:51:08.851141958+08:00","level":"INFO","msg":"handleInformTeardown: server teardown initiated","id":"1(@)"}
|
| 8 |
+
{"time":"2026-04-17T12:51:08.851692926+08:00","level":"INFO","msg":"server is shutting down"}
|
| 9 |
+
{"time":"2026-04-17T12:51:08.851679858+08:00","level":"INFO","msg":"connection: closing","id":"1(@)"}
|
| 10 |
+
{"time":"2026-04-17T12:51:08.852412712+08:00","level":"INFO","msg":"server: listener closed","addr":{"Name":"/tmp/wandb-26590-39544-1290766967/socket","Net":"unix"}}
|
| 11 |
+
{"time":"2026-04-17T12:51:08.852821471+08:00","level":"INFO","msg":"connection: closed successfully","id":"1(@)"}
|
| 12 |
+
{"time":"2026-04-17T12:51:45.045595577+08:00","level":"INFO","msg":"handleInformTeardown: server shutdown complete","id":"1(@)"}
|
| 13 |
+
{"time":"2026-04-17T12:51:45.046301783+08:00","level":"INFO","msg":"connection: ManageConnectionData: connection closed","id":"1(@)"}
|
| 14 |
+
{"time":"2026-04-17T12:51:45.046872221+08:00","level":"INFO","msg":"server is closed"}
|
wandb/run-20260417_123237-3h84yfea/logs/debug-internal.log
ADDED
|
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{"time":"2026-04-17T12:32:37.831597637+08:00","level":"INFO","msg":"stream: starting","core version":"0.23.0"}
|
| 2 |
+
{"time":"2026-04-17T12:32:38.28711188+08:00","level":"INFO","msg":"stream: created new stream","id":"3h84yfea"}
|
| 3 |
+
{"time":"2026-04-17T12:32:38.287178211+08:00","level":"INFO","msg":"handler: started","stream_id":"3h84yfea"}
|
| 4 |
+
{"time":"2026-04-17T12:32:38.291195021+08:00","level":"INFO","msg":"stream: started","id":"3h84yfea"}
|
| 5 |
+
{"time":"2026-04-17T12:32:38.291204401+08:00","level":"INFO","msg":"sender: started","stream_id":"3h84yfea"}
|
| 6 |
+
{"time":"2026-04-17T12:32:38.291218278+08:00","level":"INFO","msg":"writer: started","stream_id":"3h84yfea"}
|
| 7 |
+
{"time":"2026-04-17T12:47:19.109479888+08:00","level":"INFO","msg":"api: retrying HTTP error","status":500,"url":"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/3h84yfea/file_stream","body":"{\"error\":\"context deadline exceeded\"}"}
|
| 8 |
+
{"time":"2026-04-17T12:51:08.790892907+08:00","level":"INFO","msg":"flowcontrol: backed up, offloading to disk","recordNumber":1780}
|
| 9 |
+
{"time":"2026-04-17T12:51:08.792427055+08:00","level":"INFO","msg":"flowcontrol: unblocked","totalOffloaded":34}
|
| 10 |
+
{"time":"2026-04-17T12:51:08.85169372+08:00","level":"INFO","msg":"stream: closing","id":"3h84yfea"}
|
| 11 |
+
{"time":"2026-04-17T12:51:10.104739264+08:00","level":"INFO","msg":"fileTransfer: Close: file transfer manager closed"}
|
| 12 |
+
{"time":"2026-04-17T12:51:45.039416039+08:00","level":"INFO","msg":"handler: closed","stream_id":"3h84yfea"}
|
| 13 |
+
{"time":"2026-04-17T12:51:45.041478496+08:00","level":"INFO","msg":"sender: closed","stream_id":"3h84yfea"}
|
| 14 |
+
{"time":"2026-04-17T12:51:45.041508452+08:00","level":"INFO","msg":"stream: closed","id":"3h84yfea"}
|
wandb/run-20260417_123237-3h84yfea/logs/debug.log
ADDED
|
@@ -0,0 +1,26 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
2026-04-17 12:32:37,468 INFO MainThread:26590 [wandb_setup.py:_flush():80] Current SDK version is 0.23.0
|
| 2 |
+
2026-04-17 12:32:37,468 INFO MainThread:26590 [wandb_setup.py:_flush():80] Configure stats pid to 26590
|
| 3 |
+
2026-04-17 12:32:37,468 INFO MainThread:26590 [wandb_setup.py:_flush():80] Loading settings from /mnt/petrelfs/panjiabao/.config/wandb/settings
|
| 4 |
+
2026-04-17 12:32:37,468 INFO MainThread:26590 [wandb_setup.py:_flush():80] Loading settings from /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/wandb/settings
|
| 5 |
+
2026-04-17 12:32:37,468 INFO MainThread:26590 [wandb_setup.py:_flush():80] Loading settings from environment variables
|
| 6 |
+
2026-04-17 12:32:37,468 INFO MainThread:26590 [wandb_init.py:setup_run_log_directory():713] Logging user logs to /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/wandb/run-20260417_123237-3h84yfea/logs/debug.log
|
| 7 |
+
2026-04-17 12:32:37,468 INFO MainThread:26590 [wandb_init.py:setup_run_log_directory():714] Logging internal logs to /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/wandb/run-20260417_123237-3h84yfea/logs/debug-internal.log
|
| 8 |
+
2026-04-17 12:32:37,468 INFO MainThread:26590 [wandb_init.py:init():840] calling init triggers
|
| 9 |
+
2026-04-17 12:32:37,468 INFO MainThread:26590 [wandb_init.py:init():845] wandb.init called with sweep_config: {}
|
| 10 |
+
config: {'_wandb': {}}
|
| 11 |
+
2026-04-17 12:32:37,468 INFO MainThread:26590 [wandb_init.py:init():888] starting backend
|
| 12 |
+
2026-04-17 12:32:37,819 INFO MainThread:26590 [wandb_init.py:init():891] sending inform_init request
|
| 13 |
+
2026-04-17 12:32:37,823 INFO MainThread:26590 [wandb_init.py:init():899] backend started and connected
|
| 14 |
+
2026-04-17 12:32:37,825 INFO MainThread:26590 [wandb_init.py:init():969] updated telemetry
|
| 15 |
+
2026-04-17 12:32:37,826 INFO MainThread:26590 [wandb_init.py:init():993] communicating run to backend with 90.0 second timeout
|
| 16 |
+
2026-04-17 12:32:39,301 INFO MainThread:26590 [wandb_init.py:init():1040] starting run threads in backend
|
| 17 |
+
2026-04-17 12:32:39,937 INFO MainThread:26590 [wandb_run.py:_console_start():2504] atexit reg
|
| 18 |
+
2026-04-17 12:32:39,937 INFO MainThread:26590 [wandb_run.py:_redirect():2352] redirect: wrap_raw
|
| 19 |
+
2026-04-17 12:32:39,937 INFO MainThread:26590 [wandb_run.py:_redirect():2421] Wrapping output streams.
|
| 20 |
+
2026-04-17 12:32:39,937 INFO MainThread:26590 [wandb_run.py:_redirect():2444] Redirects installed.
|
| 21 |
+
2026-04-17 12:32:39,944 INFO MainThread:26590 [wandb_init.py:init():1080] run started, returning control to user process
|
| 22 |
+
2026-04-17 12:32:39,949 INFO MainThread:26590 [wandb_run.py:_config_callback():1385] config_cb None None {'peft_config': {'default': {'task_type': 'CAUSAL_LM', 'peft_type': 'LORA', 'auto_mapping': None, 'peft_version': '0.18.1', 'base_model_name_or_path': '/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/qwen3-asr-merged', 'revision': None, 'inference_mode': False, 'r': 8, 'target_modules': '^(thinker\\.model(?=\\.).*\\.(up_proj|v_proj|k_proj|o_proj|q_proj|gate_proj|down_proj)|thinker\\.audio_tower\\.layers(?=\\.).*\\.(v_proj|fc2|k_proj|fc1|q_proj|out_proj)|thinker\\.audio_tower\\.conv_out(?=\\.)|thinker\\.audio_tower\\.proj1(?=\\.)|thinker\\.audio_tower\\.proj2(?=\\.))$', 'exclude_modules': None, 'lora_alpha': 32, 'lora_dropout': 0.05, 'fan_in_fan_out': False, 'bias': 'none', 'use_rslora': False, 'modules_to_save': [], 'init_lora_weights': True, 'layers_to_transform': None, 'layers_pattern': None, 'rank_pattern': {}, 'alpha_pattern': {}, 'megatron_config': None, 'megatron_core': 'megatron.core', 'trainable_token_indices': None, 'loftq_config': {}, 'eva_config': None, 'corda_config': None, 'use_dora': False, 'alora_invocation_tokens': None, 'use_qalora': False, 'qalora_group_size': 16, 'layer_replication': None, 'runtime_config': {'ephemeral_gpu_offload': False}, 'lora_bias': False, 'target_parameters': None, 'arrow_config': None, 'ensure_weight_tying': False, 'lora_dtype': None, 'lorap_lr_ratio': None, 'lorap_emb_lr': 1e-06}}, 'return_dict': True, 'output_hidden_states': False, 'torchscript': False, 'dtype': 'bfloat16', 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'architectures': ['Qwen3ASRForConditionalGeneration'], 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'task_specific_params': None, 'problem_type': None, 
'tokenizer_class': None, 'prefix': None, 'bos_token_id': None, 'pad_token_id': 151643, 'eos_token_id': 151645, 'sep_token_id': None, 'decoder_start_token_id': None, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'temperature': 0.5, 'top_k': 50, 'top_p': 0.95, 'typical_p': 1.0, 'repetition_penalty': 1.08, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'num_beam_groups': 1, 'diversity_penalty': 0.0, '_name_or_path': '/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/qwen3-asr-merged', 'transformers_version': '4.57.6', 'model_type': 'qwen3_asr', 'tf_legacy_loss': False, 'use_bfloat16': False, 'thinker_config': {'return_dict': True, 'output_hidden_states': False, 'torchscript': False, 'dtype': 'bfloat16', 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'architectures': ['Qwen3ASRForConditionalGeneration'], 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'task_specific_params': None, 'problem_type': None, 'tokenizer_class': None, 'prefix': None, 'bos_token_id': None, 'pad_token_id': None, 'eos_token_id': None, 'sep_token_id': None, 'decoder_start_token_id': None, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'typical_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 
'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'num_beam_groups': 1, 'diversity_penalty': 0.0, '_name_or_path': '', 'audio_end_token_id': 151670, 'model_type': 'qwen3_asr_thinker', 'tf_legacy_loss': False, 'use_bfloat16': False, 'user_token_id': 872, 'audio_start_token_id': 151669, 'initializer_range': 0.02, 'audio_config': {'return_dict': True, 'output_hidden_states': False, 'torchscript': False, 'dtype': None, 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'architectures': None, 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'task_specific_params': None, 'problem_type': None, 'tokenizer_class': None, 'prefix': None, 'bos_token_id': None, 'pad_token_id': None, 'eos_token_id': None, 'sep_token_id': None, 'decoder_start_token_id': None, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'typical_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'num_beam_groups': 1, 'diversity_penalty': 0.0, '_name_or_path': '', 'model_type': 'qwen3_asr_audio_encoder', 'num_hidden_layers': 24, 'tf_legacy_loss': False, 'use_bfloat16': False, 'num_mel_bins': 128, 'd_model': 
1024, 'encoder_layers': 24, 'encoder_attention_heads': 16, 'encoder_ffn_dim': 4096, 'dropout': 0, 'attention_dropout': 0, 'activation_function': 'gelu', 'activation_dropout': 0, 'initializer_range': 0.02, 'scale_embedding': False, 'max_source_positions': 1500, 'n_window': 50, 'output_dim': 2048, 'n_window_infer': 800, 'conv_chunksize': 500, 'downsample_hidden_size': 480, 'output_attentions': False}, 'text_config': {'vocab_size': 151936, 'max_position_embeddings': 65536, 'hidden_size': 2048, 'intermediate_size': 6144, 'num_hidden_layers': 28, 'num_attention_heads': 16, 'num_key_value_heads': 8, 'head_dim': 128, 'hidden_act': 'silu', 'initializer_range': 0.02, 'rms_norm_eps': 1e-06, 'use_cache': False, 'rope_theta': 1000000, 'rope_scaling': {'interleaved': True, 'mrope_interleaved': True, 'mrope_section': [24, 20, 20], 'rope_type': 'default', 'type': 'default'}, 'attention_bias': False, 'attention_dropout': 0.0, 'return_dict': True, 'output_hidden_states': False, 'torchscript': False, 'dtype': None, 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'architectures': None, 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'task_specific_params': None, 'problem_type': None, 'tokenizer_class': None, 'prefix': None, 'bos_token_id': None, 'pad_token_id': 151643, 'eos_token_id': None, 'sep_token_id': None, 'decoder_start_token_id': None, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'typical_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 
'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'num_beam_groups': 1, 'diversity_penalty': 0.0, '_name_or_path': '', 'model_type': 'qwen3_asr_text', 'tf_legacy_loss': False, 'use_bfloat16': False, 'output_attentions': False}, 'audio_token_id': 151676, 'output_attentions': False}, 'support_languages': ['Chinese', 'English', 'Cantonese', 'Arabic', 'German', 'French', 'Spanish', 'Portuguese', 'Indonesian', 'Italian', 'Korean', 'Russian', 'Thai', 'Vietnamese', 'Japanese', 'Turkish', 'Hindi', 'Malay', 'Dutch', 'Swedish', 'Danish', 'Finnish', 'Polish', 'Czech', 'Filipino', 'Persian', 'Greek', 'Romanian', 'Hungarian', 'Macedonian'], 'output_attentions': False, 'output_dir': '/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/out/qwen3asr_dapo_reward56_4x4x12_12gen_4GPU/v3-20260417-123227', 'overwrite_output_dir': False, 'do_train': False, 'do_eval': True, 'do_predict': False, 'eval_strategy': 'steps', 'prediction_loss_only': False, 'per_device_train_batch_size': 8, 'per_device_eval_batch_size': 8, 'per_gpu_train_batch_size': None, 'per_gpu_eval_batch_size': None, 'gradient_accumulation_steps': 12, 'eval_accumulation_steps': None, 'eval_delay': 0, 'torch_empty_cache_steps': None, 'learning_rate': 5e-05, 'weight_decay': 0.1, 'adam_beta1': 0.9, 'adam_beta2': 0.95, 'adam_epsilon': 1e-08, 'max_grad_norm': 1.0, 'num_train_epochs': 3.0, 'max_steps': -1, 'lr_scheduler_type': 'cosine', 'lr_scheduler_kwargs': None, 'warmup_ratio': 0.03, 'warmup_steps': 0, 'log_level': 'passive', 'log_level_replica': 'warning', 'log_on_each_node': True, 'logging_dir': '/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/out/qwen3asr_dapo_reward56_4x4x12_12gen_4GPU/v3-20260417-123227/runs', 'logging_strategy': 'steps', 'logging_first_step': True, 'logging_steps': 5, 'logging_nan_inf_filter': True, 'save_strategy': 'steps', 'save_steps': 20, 'save_total_limit': 
None, 'save_safetensors': True, 'save_on_each_node': False, 'save_only_model': False, 'restore_callback_states_from_checkpoint': False, 'no_cuda': False, 'use_cpu': False, 'use_mps_device': False, 'seed': 42, 'data_seed': 42, 'jit_mode_eval': False, 'bf16': True, 'fp16': False, 'fp16_opt_level': 'O1', 'half_precision_backend': 'auto', 'bf16_full_eval': False, 'fp16_full_eval': False, 'tf32': None, 'local_rank': 0, 'ddp_backend': None, 'tpu_num_cores': None, 'tpu_metrics_debug': False, 'debug': [], 'dataloader_drop_last': True, 'eval_steps': 20, 'dataloader_num_workers': 1, 'dataloader_prefetch_factor': 2, 'past_index': -1, 'run_name': 'qwen3asr_dapo_reward56_4x4x12_12gen_4GPU', 'disable_tqdm': False, 'remove_unused_columns': False, 'label_names': None, 'load_best_model_at_end': False, 'metric_for_best_model': 'loss', 'greater_is_better': False, 'ignore_data_skip': False, 'fsdp': [], 'fsdp_min_num_params': 0, 'fsdp_config': {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}, 'fsdp_transformer_layer_cls_to_wrap': None, 'accelerator_config': {'split_batches': False, 'dispatch_batches': False, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None}, 'parallelism_config': None, 'deepspeed': None, 'label_smoothing_factor': 0.0, 'optim': 'adamw_torch', 'optim_args': None, 'adafactor': False, 'group_by_length': False, 'length_column_name': 'length', 'report_to': ['wandb'], 'project': 'huggingface', 'trackio_space_id': 'trackio', 'ddp_find_unused_parameters': None, 'ddp_bucket_cap_mb': None, 'ddp_broadcast_buffers': None, 'dataloader_pin_memory': True, 'dataloader_persistent_workers': False, 'skip_memory_metrics': True, 'use_legacy_prediction_loop': False, 'push_to_hub': False, 'resume_from_checkpoint': None, 'hub_model_id': None, 'hub_strategy': 'every_save', 'hub_token': '<HUB_TOKEN>', 'hub_private_repo': None, 'hub_always_push': False, 'hub_revision': None, 
'gradient_checkpointing': False, 'gradient_checkpointing_kwargs': None, 'include_inputs_for_metrics': False, 'include_for_metrics': [], 'eval_do_concat_batches': True, 'fp16_backend': 'auto', 'push_to_hub_model_id': None, 'push_to_hub_organization': None, 'push_to_hub_token': '<PUSH_TO_HUB_TOKEN>', 'mp_parameters': '', 'auto_find_batch_size': False, 'full_determinism': False, 'torchdynamo': None, 'ray_scope': 'last', 'ddp_timeout': 18000000, 'torch_compile': False, 'torch_compile_backend': None, 'torch_compile_mode': None, 'include_tokens_per_second': False, 'include_num_input_tokens_seen': 'no', 'neftune_noise_alpha': None, 'optim_target_modules': None, 'batch_eval_metrics': False, 'eval_on_start': False, 'use_liger_kernel': False, 'liger_kernel_config': None, 'eval_use_gather_object': False, 'average_tokens_across_devices': True, 'model_init_kwargs': None, 'disable_dropout': False, 'cast_lm_head_to_fp32': False, 'num_generations': 12, 'num_generations_eval': 4, 'max_completion_length': 256, 'ds3_gather_for_generation': True, 'shuffle_dataset': True, 'generation_batch_size': 48, 'steps_per_generation': 3, 'min_p': None, 'generation_kwargs': None, 'chat_template_kwargs': None, 'use_transformers_paged': False, 'cache_implementation': None, 'use_vllm': False, 'vllm_mode': None, 'vllm_model_impl': 'vllm', 'vllm_enable_sleep_mode': False, 'vllm_structured_outputs_regex': None, 'vllm_server_base_url': None, 'vllm_server_host': None, 'vllm_server_port': [8000], 'vllm_server_timeout': 240.0, 'vllm_group_port': 51216, 'vllm_gpu_memory_utilization': 0.9, 'vllm_max_model_length': None, 'vllm_tensor_parallel_size': 1, 'beta': 0.04, 'num_iterations': 2, 'epsilon': 0.2, 'delta': None, 'epsilon_high': 0.28, 'sapo_temperature_neg': 1.05, 'sapo_temperature_pos': 1.0, 'importance_sampling_level': 'token', 'reward_weights': None, 'multi_objective_aggregation': 'sum_then_normalize', 'scale_rewards': 'group', 'loss_type': 'dapo', 'mask_truncated_completions': False, 'sync_ref_model': 
False, 'ref_model_mixup_alpha': 0.6, 'ref_model_sync_steps': 512, 'top_entropy_quantile': 1.0, 'max_tool_calling_iterations': None, 'vllm_importance_sampling_correction': True, 'vllm_importance_sampling_mode': 'sequence_mask', 'vllm_importance_sampling_cap': 3.0, 'off_policy_mask_threshold': None, 'use_bias_correction_kl': False, 'log_completions': True, 'num_completions_to_print': None, 'log_unique_prompts': False, 'log_completions_hub_repo': None, 'tuner_backend': 'peft', 'vit_gradient_checkpointing': True, 'router_aux_loss_coef': 0.0, 'enable_dft_loss': False, 'enable_channel_loss': False, 'safe_serialization': True, 'max_shard_size': '5GB', 'check_model': True, 'acc_strategy': 'token', 'train_dataloader_shuffle': True, 'max_epochs': None, 'aligner_lr': None, 'vit_lr': None, 'use_logits_to_keep': None, 'resume_only_model': False, 'optimizer': None, 'eval_metric': None, 'callbacks': [], 'early_stop_interval': None, 'eval_use_evalscope': False, 'eval_dataset': [], 'eval_dataset_args': None, 'eval_limit': None, 'eval_generation_config': None, 'extra_eval_args': None, 'tuner_type': 'lora', 'use_galore': False, 'galore_target_modules': None, 'galore_rank': 128, 'galore_update_proj_gap': 50, 'galore_scale': 1.0, 'galore_proj_type': 'std', 'galore_optim_per_parameter': False, 'galore_with_embedding': False, 'galore_quantization': False, 'galore_proj_quant': False, 'galore_proj_bits': 4, 'galore_proj_group_size': 256, 'galore_cos_threshold': 0.4, 'galore_gamma_proj': 2, 'galore_queue_size': 5, 'lisa_activated_layers': 0, 'lisa_step_interval': 20, 'use_flash_ckpt': False, 'vllm_pipeline_parallel_size': 1, 'vllm_enable_expert_parallel': False, 'vllm_max_num_seqs': None, 'vllm_max_model_len': None, 'vllm_disable_custom_all_reduce': True, 'vllm_enforce_eager': False, 'vllm_limit_mm_per_prompt': None, 'vllm_max_lora_rank': 16, 'vllm_enable_prefix_caching': True, 'vllm_use_async_engine': None, 'vllm_quantization': None, 'vllm_reasoning_parser': None, 
'vllm_disable_cascade_attn': False, 'vllm_mm_processor_cache_gb': None, 'vllm_speculative_config': None, 'vllm_engine_kwargs': {}, 'vllm_data_parallel_size': 1, 'stop_words': [], 'vllm_enable_lora': False, 'lora_rank': 8, 'vllm_server_group_port': None, 'enable_flattened_weight_sync': True, 'async_generate': False, 'structured_outputs_regex': None, 'sleep_level': 0, 'move_model_batches': None, 'offload_optimizer': False, 'offload_model': False, 'wandb_log_unique_prompts': None, 'cosine_min_len_value_wrong': -0.5, 'cosine_max_len_value_wrong': 0.0, 'cosine_min_len_value_correct': 1.0, 'cosine_max_len_value_correct': 0.5, 'cosine_max_len': 256, 'repetition_n_grams': 3, 'repetition_max_penalty': -1.0, 'reward_model': None, 'reward_model_plugin': None, 'chord_sft_dataset': [], 'chord_sft_per_device_train_batch_size': None, 'chord_enable_phi_function': False, 'chord_mu_warmup_steps': None, 'chord_mu_decay_steps': None, 'chord_mu_peak': None, 'chord_mu_valley': None, 'multi_turn_scheduler': None, 'max_turns': None, 'completion_length_limit_scope': 'per_round', 'vllm_server_pass_dataset': False, 'dynamic_sample': True, 'max_resample_times': 4, 'overlong_filter': True, 'soft_max_length': None, 'soft_cache_length': None, 'log_entropy': False, 'tau_pos': 1.0, 'tau_neg': 1.05, 'advantage_estimator': 'grpo', 'kl_in_reward': False, 'dataset_shuffle': True, 'rollout_importance_sampling_mode': None, 'rollout_importance_sampling_threshold': 2.0, 'log_rollout_offpolicy_metrics': False, 'off_policy_sequence_mask_delta': None}
|
| 23 |
+
2026-04-17 12:32:39,959 INFO MainThread:26590 [wandb_config.py:__setitem__():154] [no run ID] config set model/num_parameters = 2050307712 - <bound method Run._config_callback of <wandb.sdk.wandb_run.Run object at 0x7f553c81a9e0>>
|
| 24 |
+
2026-04-17 12:32:39,959 INFO MainThread:26590 [wandb_run.py:_config_callback():1385] config_cb model/num_parameters 2050307712 None
|
| 25 |
+
2026-04-17 12:51:08,851 INFO wandb-AsyncioManager-main:26590 [service_client.py:_forward_responses():80] Reached EOF.
|
| 26 |
+
2026-04-17 12:51:08,851 INFO wandb-AsyncioManager-main:26590 [mailbox.py:close():137] Closing mailbox, abandoning 1 handles.
|
wandb/run-20260417_125349-3c0s7mq3/files/config.yaml
ADDED
|
@@ -0,0 +1,1273 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
_name_or_path:
|
| 2 |
+
value: /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/qwen3-asr-merged
|
| 3 |
+
_wandb:
|
| 4 |
+
value:
|
| 5 |
+
cli_version: 0.23.0
|
| 6 |
+
e:
|
| 7 |
+
j5sm4ok14e8glxftszvcldkdpfaj9tjk:
|
| 8 |
+
args:
|
| 9 |
+
- --rlhf_type
|
| 10 |
+
- grpo
|
| 11 |
+
- --external_plugins
|
| 12 |
+
- /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/my_qwen3_asr_dapo_register.py
|
| 13 |
+
- /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/0417_reward.py
|
| 14 |
+
- --model
|
| 15 |
+
- /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/qwen3-asr-merged
|
| 16 |
+
- --model_type
|
| 17 |
+
- my_qwen3_asr_rl
|
| 18 |
+
- --template
|
| 19 |
+
- my_qwen3_asr_rl
|
| 20 |
+
- --dataset
|
| 21 |
+
- /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/lora_0323_10w+55w+error+syn_with_domain_train90_targeted_rl_train90_loramerged_basewer_3suppress_server.jsonl
|
| 22 |
+
- --val_dataset
|
| 23 |
+
- /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/lora_0323_10w+55w+error+syn_with_domain_train90_targeted_rl_val5_sample5p_server.jsonl
|
| 24 |
+
- --reward_funcs
|
| 25 |
+
- asr_wer_sub_len_cmp_hallu_dirty_v56
|
| 26 |
+
- --train_type
|
| 27 |
+
- lora
|
| 28 |
+
- --use_vllm
|
| 29 |
+
- "false"
|
| 30 |
+
- --log_completions
|
| 31 |
+
- "true"
|
| 32 |
+
- --loss_type
|
| 33 |
+
- dapo
|
| 34 |
+
- --advantage_estimator
|
| 35 |
+
- grpo
|
| 36 |
+
- --scale_rewards
|
| 37 |
+
- group
|
| 38 |
+
- --num_iterations
|
| 39 |
+
- "2"
|
| 40 |
+
- --beta
|
| 41 |
+
- "0.04"
|
| 42 |
+
- --epsilon_high
|
| 43 |
+
- "0.28"
|
| 44 |
+
- --dynamic_sample
|
| 45 |
+
- "true"
|
| 46 |
+
- --max_resample_times
|
| 47 |
+
- "4"
|
| 48 |
+
- --overlong_filter
|
| 49 |
+
- "true"
|
| 50 |
+
- --truncation_strategy
|
| 51 |
+
- delete
|
| 52 |
+
- --num_generations
|
| 53 |
+
- "12"
|
| 54 |
+
- --generation_batch_size
|
| 55 |
+
- "48"
|
| 56 |
+
- --per_device_train_batch_size
|
| 57 |
+
- "4"
|
| 58 |
+
- --per_device_eval_batch_size
|
| 59 |
+
- "4"
|
| 60 |
+
- --gradient_accumulation_steps
|
| 61 |
+
- "12"
|
| 62 |
+
- --num_generations_eval
|
| 63 |
+
- "4"
|
| 64 |
+
- --max_completion_length
|
| 65 |
+
- "256"
|
| 66 |
+
- --temperature
|
| 67 |
+
- "0.50"
|
| 68 |
+
- --top_p
|
| 69 |
+
- "0.95"
|
| 70 |
+
- --top_k
|
| 71 |
+
- "50"
|
| 72 |
+
- --repetition_penalty
|
| 73 |
+
- "1.08"
|
| 74 |
+
- --learning_rate
|
| 75 |
+
- "5e-5"
|
| 76 |
+
- --lr_scheduler_type
|
| 77 |
+
- cosine
|
| 78 |
+
- --warmup_ratio
|
| 79 |
+
- "0.03"
|
| 80 |
+
- --report_to
|
| 81 |
+
- wandb
|
| 82 |
+
- --run_name
|
| 83 |
+
- qwen3asr_dapo_reward56_4x4x12_12gen_4GPU
|
| 84 |
+
- --output_dir
|
| 85 |
+
- /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/out/qwen3asr_dapo_reward56_4x4x12_12gen_4GPU
|
| 86 |
+
- --save_strategy
|
| 87 |
+
- steps
|
| 88 |
+
- --save_steps
|
| 89 |
+
- "20"
|
| 90 |
+
- --logging_steps
|
| 91 |
+
- "5"
|
| 92 |
+
- --freeze_llm
|
| 93 |
+
- "false"
|
| 94 |
+
- --freeze_vit
|
| 95 |
+
- "false"
|
| 96 |
+
- --freeze_aligner
|
| 97 |
+
- "false"
|
| 98 |
+
- --remove_unused_columns
|
| 99 |
+
- "false"
|
| 100 |
+
- --padding_side
|
| 101 |
+
- left
|
| 102 |
+
cpu_count: 64
|
| 103 |
+
cpu_count_logical: 128
|
| 104 |
+
cudaVersion: "12.4"
|
| 105 |
+
disk:
|
| 106 |
+
/:
|
| 107 |
+
total: "524945911808"
|
| 108 |
+
used: "49879580672"
|
| 109 |
+
email: pang_kaiyu@163.com
|
| 110 |
+
executable: /mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/bin/python3.10
|
| 111 |
+
gpu: NVIDIA A100-SXM4-80GB
|
| 112 |
+
gpu_count: 8
|
| 113 |
+
gpu_nvidia:
|
| 114 |
+
- architecture: Ampere
|
| 115 |
+
cudaCores: 6912
|
| 116 |
+
memoryTotal: "85899345920"
|
| 117 |
+
name: NVIDIA A100-SXM4-80GB
|
| 118 |
+
uuid: GPU-3da6624c-f6f7-fce6-4711-27acab73dc93
|
| 119 |
+
- architecture: Ampere
|
| 120 |
+
cudaCores: 6912
|
| 121 |
+
memoryTotal: "85899345920"
|
| 122 |
+
name: NVIDIA A100-SXM4-80GB
|
| 123 |
+
uuid: GPU-dae83544-a631-a3fe-b5d5-e4fdd056c7a8
|
| 124 |
+
- architecture: Ampere
|
| 125 |
+
cudaCores: 6912
|
| 126 |
+
memoryTotal: "85899345920"
|
| 127 |
+
name: NVIDIA A100-SXM4-80GB
|
| 128 |
+
uuid: GPU-621aa0b9-4a32-d349-8a16-20b8b6f0dde4
|
| 129 |
+
- architecture: Ampere
|
| 130 |
+
cudaCores: 6912
|
| 131 |
+
memoryTotal: "85899345920"
|
| 132 |
+
name: NVIDIA A100-SXM4-80GB
|
| 133 |
+
uuid: GPU-642bed5e-3bf1-b5e0-8aba-33f8f64a5dcc
|
| 134 |
+
- architecture: Ampere
|
| 135 |
+
cudaCores: 6912
|
| 136 |
+
memoryTotal: "85899345920"
|
| 137 |
+
name: NVIDIA A100-SXM4-80GB
|
| 138 |
+
uuid: GPU-6c70bd3b-1e58-bd2a-a10b-19891e3eab9a
|
| 139 |
+
- architecture: Ampere
|
| 140 |
+
cudaCores: 6912
|
| 141 |
+
memoryTotal: "85899345920"
|
| 142 |
+
name: NVIDIA A100-SXM4-80GB
|
| 143 |
+
uuid: GPU-96e9e2d3-6436-3c7f-5a20-1d4a32e7992c
|
| 144 |
+
- architecture: Ampere
|
| 145 |
+
cudaCores: 6912
|
| 146 |
+
memoryTotal: "85899345920"
|
| 147 |
+
name: NVIDIA A100-SXM4-80GB
|
| 148 |
+
uuid: GPU-dba7546f-0cda-e659-ca1d-4790c27ffe8d
|
| 149 |
+
- architecture: Ampere
|
| 150 |
+
cudaCores: 6912
|
| 151 |
+
memoryTotal: "85899345920"
|
| 152 |
+
name: NVIDIA A100-SXM4-80GB
|
| 153 |
+
uuid: GPU-b0a96cf9-74f3-969a-e8d0-5a30f3f06d1e
|
| 154 |
+
host: SH-IDC1-10-140-37-28
|
| 155 |
+
memory:
|
| 156 |
+
total: "1081627828224"
|
| 157 |
+
os: Linux-3.10.0-957.el7.x86_64-x86_64-with-glibc2.17
|
| 158 |
+
program: /mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/cli/rlhf.py
|
| 159 |
+
python: CPython 3.10.18
|
| 160 |
+
root: /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload
|
| 161 |
+
slurm:
|
| 162 |
+
cluster_name: cluster_sproject3
|
| 163 |
+
conf: /etc/slurm/slurm.conf
|
| 164 |
+
cpus_on_node: "2"
|
| 165 |
+
gtids: "0"
|
| 166 |
+
job_account: research
|
| 167 |
+
job_cpus_per_node: "2"
|
| 168 |
+
job_gid: "800000689"
|
| 169 |
+
job_id: "8568855"
|
| 170 |
+
job_name: qwen3_asr_train_4gpu
|
| 171 |
+
job_nodelist: SH-IDC1-10-140-37-28
|
| 172 |
+
job_num_nodes: "1"
|
| 173 |
+
job_partition: interntmp
|
| 174 |
+
job_qos: normal
|
| 175 |
+
job_uid: "800000689"
|
| 176 |
+
job_user: panjiabao
|
| 177 |
+
jobid: "8568855"
|
| 178 |
+
launch_node_ipaddr: 10.140.37.164
|
| 179 |
+
localid: "0"
|
| 180 |
+
nnodes: "1"
|
| 181 |
+
nodeid: "0"
|
| 182 |
+
nodelist: SH-IDC1-10-140-37-28
|
| 183 |
+
nprocs: "1"
|
| 184 |
+
ntasks: "1"
|
| 185 |
+
ntasks_per_node: "1"
|
| 186 |
+
prio_process: "0"
|
| 187 |
+
procid: "0"
|
| 188 |
+
srun_comm_host: 10.140.37.164
|
| 189 |
+
srun_comm_port: "39944"
|
| 190 |
+
step_gpus: 4,5,6,7
|
| 191 |
+
step_id: "0"
|
| 192 |
+
step_launcher_port: "39944"
|
| 193 |
+
step_nodelist: SH-IDC1-10-140-37-28
|
| 194 |
+
step_num_nodes: "1"
|
| 195 |
+
step_num_tasks: "1"
|
| 196 |
+
step_tasks_per_node: "1"
|
| 197 |
+
stepid: "0"
|
| 198 |
+
submit_dir: /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload
|
| 199 |
+
submit_host: SH-IDC1-10-140-37-164
|
| 200 |
+
task_pid: "253884"
|
| 201 |
+
tasks_per_node: "1"
|
| 202 |
+
topology_addr: SH-IDC1-10-140-37-28
|
| 203 |
+
topology_addr_pattern: node
|
| 204 |
+
umask: "0002"
|
| 205 |
+
working_cluster: cluster_sproject3:SH-IDC1-10-140-37-161:6817:9216:109
|
| 206 |
+
startedAt: "2026-04-17T04:53:49.174280Z"
|
| 207 |
+
writerId: j5sm4ok14e8glxftszvcldkdpfaj9tjk
|
| 208 |
+
m:
|
| 209 |
+
- "1": train/global_step
|
| 210 |
+
"6":
|
| 211 |
+
- 3
|
| 212 |
+
"7": []
|
| 213 |
+
- "2": '*'
|
| 214 |
+
"5": 1
|
| 215 |
+
"6":
|
| 216 |
+
- 1
|
| 217 |
+
"7": []
|
| 218 |
+
python_version: 3.10.18
|
| 219 |
+
t:
|
| 220 |
+
"1":
|
| 221 |
+
- 1
|
| 222 |
+
- 5
|
| 223 |
+
- 11
|
| 224 |
+
- 30
|
| 225 |
+
- 41
|
| 226 |
+
- 49
|
| 227 |
+
- 51
|
| 228 |
+
- 53
|
| 229 |
+
- 71
|
| 230 |
+
- 84
|
| 231 |
+
- 95
|
| 232 |
+
- 98
|
| 233 |
+
- 105
|
| 234 |
+
"2":
|
| 235 |
+
- 1
|
| 236 |
+
- 5
|
| 237 |
+
- 11
|
| 238 |
+
- 30
|
| 239 |
+
- 41
|
| 240 |
+
- 49
|
| 241 |
+
- 51
|
| 242 |
+
- 53
|
| 243 |
+
- 71
|
| 244 |
+
- 84
|
| 245 |
+
- 95
|
| 246 |
+
- 98
|
| 247 |
+
- 105
|
| 248 |
+
"3":
|
| 249 |
+
- 7
|
| 250 |
+
- 13
|
| 251 |
+
- 19
|
| 252 |
+
- 66
|
| 253 |
+
"4": 3.10.18
|
| 254 |
+
"5": 0.23.0
|
| 255 |
+
"6": 4.57.6
|
| 256 |
+
"9":
|
| 257 |
+
"1": transformers_trainer
|
| 258 |
+
"12": 0.23.0
|
| 259 |
+
"13": linux-x86_64
|
| 260 |
+
acc_strategy:
|
| 261 |
+
value: token
|
| 262 |
+
accelerator_config:
|
| 263 |
+
value:
|
| 264 |
+
dispatch_batches: false
|
| 265 |
+
even_batches: true
|
| 266 |
+
gradient_accumulation_kwargs: null
|
| 267 |
+
non_blocking: false
|
| 268 |
+
split_batches: false
|
| 269 |
+
use_seedable_sampler: true
|
| 270 |
+
adafactor:
|
| 271 |
+
value: false
|
| 272 |
+
adam_beta1:
|
| 273 |
+
value: 0.9
|
| 274 |
+
adam_beta2:
|
| 275 |
+
value: 0.95
|
| 276 |
+
adam_epsilon:
|
| 277 |
+
value: 1e-08
|
| 278 |
+
add_cross_attention:
|
| 279 |
+
value: false
|
| 280 |
+
advantage_estimator:
|
| 281 |
+
value: grpo
|
| 282 |
+
aligner_lr:
|
| 283 |
+
value: null
|
| 284 |
+
architectures:
|
| 285 |
+
value:
|
| 286 |
+
- Qwen3ASRForConditionalGeneration
|
| 287 |
+
async_generate:
|
| 288 |
+
value: false
|
| 289 |
+
auto_find_batch_size:
|
| 290 |
+
value: false
|
| 291 |
+
average_tokens_across_devices:
|
| 292 |
+
value: true
|
| 293 |
+
bad_words_ids:
|
| 294 |
+
value: null
|
| 295 |
+
batch_eval_metrics:
|
| 296 |
+
value: false
|
| 297 |
+
begin_suppress_tokens:
|
| 298 |
+
value: null
|
| 299 |
+
beta:
|
| 300 |
+
value: 0.04
|
| 301 |
+
bf16:
|
| 302 |
+
value: true
|
| 303 |
+
bf16_full_eval:
|
| 304 |
+
value: false
|
| 305 |
+
bos_token_id:
|
| 306 |
+
value: null
|
| 307 |
+
cache_implementation:
|
| 308 |
+
value: null
|
| 309 |
+
callbacks:
|
| 310 |
+
value: []
|
| 311 |
+
cast_lm_head_to_fp32:
|
| 312 |
+
value: false
|
| 313 |
+
chat_template_kwargs:
|
| 314 |
+
value: null
|
| 315 |
+
check_model:
|
| 316 |
+
value: true
|
| 317 |
+
chord_enable_phi_function:
|
| 318 |
+
value: false
|
| 319 |
+
chord_mu_decay_steps:
|
| 320 |
+
value: null
|
| 321 |
+
chord_mu_peak:
|
| 322 |
+
value: null
|
| 323 |
+
chord_mu_valley:
|
| 324 |
+
value: null
|
| 325 |
+
chord_mu_warmup_steps:
|
| 326 |
+
value: null
|
| 327 |
+
chord_sft_dataset:
|
| 328 |
+
value: []
|
| 329 |
+
chord_sft_per_device_train_batch_size:
|
| 330 |
+
value: null
|
| 331 |
+
chunk_size_feed_forward:
|
| 332 |
+
value: 0
|
| 333 |
+
completion_length_limit_scope:
|
| 334 |
+
value: per_round
|
| 335 |
+
cosine_max_len:
|
| 336 |
+
value: 256
|
| 337 |
+
cosine_max_len_value_correct:
|
| 338 |
+
value: 0.5
|
| 339 |
+
cosine_max_len_value_wrong:
|
| 340 |
+
value: 0
|
| 341 |
+
cosine_min_len_value_correct:
|
| 342 |
+
value: 1
|
| 343 |
+
cosine_min_len_value_wrong:
|
| 344 |
+
value: -0.5
|
| 345 |
+
cross_attention_hidden_size:
|
| 346 |
+
value: null
|
| 347 |
+
data_seed:
|
| 348 |
+
value: 42
|
| 349 |
+
dataloader_drop_last:
|
| 350 |
+
value: true
|
| 351 |
+
dataloader_num_workers:
|
| 352 |
+
value: 1
|
| 353 |
+
dataloader_persistent_workers:
|
| 354 |
+
value: false
|
| 355 |
+
dataloader_pin_memory:
|
| 356 |
+
value: true
|
| 357 |
+
dataloader_prefetch_factor:
|
| 358 |
+
value: 2
|
| 359 |
+
dataset_shuffle:
|
| 360 |
+
value: true
|
| 361 |
+
ddp_backend:
|
| 362 |
+
value: null
|
| 363 |
+
ddp_broadcast_buffers:
|
| 364 |
+
value: null
|
| 365 |
+
ddp_bucket_cap_mb:
|
| 366 |
+
value: null
|
| 367 |
+
ddp_find_unused_parameters:
|
| 368 |
+
value: null
|
| 369 |
+
ddp_timeout:
|
| 370 |
+
value: 18000000
|
| 371 |
+
debug:
|
| 372 |
+
value: []
|
| 373 |
+
decoder_start_token_id:
|
| 374 |
+
value: null
|
| 375 |
+
deepspeed:
|
| 376 |
+
value: null
|
| 377 |
+
delta:
|
| 378 |
+
value: null
|
| 379 |
+
disable_dropout:
|
| 380 |
+
value: false
|
| 381 |
+
disable_tqdm:
|
| 382 |
+
value: false
|
| 383 |
+
diversity_penalty:
|
| 384 |
+
value: 0
|
| 385 |
+
do_eval:
|
| 386 |
+
value: true
|
| 387 |
+
do_predict:
|
| 388 |
+
value: false
|
| 389 |
+
do_sample:
|
| 390 |
+
value: false
|
| 391 |
+
do_train:
|
| 392 |
+
value: false
|
| 393 |
+
ds3_gather_for_generation:
|
| 394 |
+
value: true
|
| 395 |
+
dtype:
|
| 396 |
+
value: bfloat16
|
| 397 |
+
dynamic_sample:
|
| 398 |
+
value: true
|
| 399 |
+
early_stop_interval:
|
| 400 |
+
value: null
|
| 401 |
+
early_stopping:
|
| 402 |
+
value: false
|
| 403 |
+
enable_channel_loss:
|
| 404 |
+
value: false
|
| 405 |
+
enable_dft_loss:
|
| 406 |
+
value: false
|
| 407 |
+
enable_flattened_weight_sync:
|
| 408 |
+
value: true
|
| 409 |
+
encoder_no_repeat_ngram_size:
|
| 410 |
+
value: 0
|
| 411 |
+
eos_token_id:
|
| 412 |
+
value: 151645
|
| 413 |
+
epsilon:
|
| 414 |
+
value: 0.2
|
| 415 |
+
epsilon_high:
|
| 416 |
+
value: 0.28
|
| 417 |
+
eval_accumulation_steps:
|
| 418 |
+
value: null
|
| 419 |
+
eval_dataset:
|
| 420 |
+
value: []
|
| 421 |
+
eval_dataset_args:
|
| 422 |
+
value: null
|
| 423 |
+
eval_delay:
|
| 424 |
+
value: 0
|
| 425 |
+
eval_do_concat_batches:
|
| 426 |
+
value: true
|
| 427 |
+
eval_generation_config:
|
| 428 |
+
value: null
|
| 429 |
+
eval_limit:
|
| 430 |
+
value: null
|
| 431 |
+
eval_metric:
|
| 432 |
+
value: null
|
| 433 |
+
eval_on_start:
|
| 434 |
+
value: false
|
| 435 |
+
eval_steps:
|
| 436 |
+
value: 20
|
| 437 |
+
eval_strategy:
|
| 438 |
+
value: steps
|
| 439 |
+
eval_use_evalscope:
|
| 440 |
+
value: false
|
| 441 |
+
eval_use_gather_object:
|
| 442 |
+
value: false
|
| 443 |
+
exponential_decay_length_penalty:
|
| 444 |
+
value: null
|
| 445 |
+
extra_eval_args:
|
| 446 |
+
value: null
|
| 447 |
+
finetuning_task:
|
| 448 |
+
value: null
|
| 449 |
+
forced_bos_token_id:
|
| 450 |
+
value: null
|
| 451 |
+
forced_eos_token_id:
|
| 452 |
+
value: null
|
| 453 |
+
fp16:
|
| 454 |
+
value: false
|
| 455 |
+
fp16_backend:
|
| 456 |
+
value: auto
|
| 457 |
+
fp16_full_eval:
|
| 458 |
+
value: false
|
| 459 |
+
fp16_opt_level:
|
| 460 |
+
value: O1
|
| 461 |
+
fsdp:
|
| 462 |
+
value: []
|
| 463 |
+
fsdp_config:
|
| 464 |
+
value:
|
| 465 |
+
min_num_params: 0
|
| 466 |
+
xla: false
|
| 467 |
+
xla_fsdp_grad_ckpt: false
|
| 468 |
+
xla_fsdp_v2: false
|
| 469 |
+
fsdp_min_num_params:
|
| 470 |
+
value: 0
|
| 471 |
+
fsdp_transformer_layer_cls_to_wrap:
|
| 472 |
+
value: null
|
| 473 |
+
full_determinism:
|
| 474 |
+
value: false
|
| 475 |
+
galore_cos_threshold:
|
| 476 |
+
value: 0.4
|
| 477 |
+
galore_gamma_proj:
|
| 478 |
+
value: 2
|
| 479 |
+
galore_optim_per_parameter:
|
| 480 |
+
value: false
|
| 481 |
+
galore_proj_bits:
|
| 482 |
+
value: 4
|
| 483 |
+
galore_proj_group_size:
|
| 484 |
+
value: 256
|
| 485 |
+
galore_proj_quant:
|
| 486 |
+
value: false
|
| 487 |
+
galore_proj_type:
|
| 488 |
+
value: std
|
| 489 |
+
galore_quantization:
|
| 490 |
+
value: false
|
| 491 |
+
galore_queue_size:
|
| 492 |
+
value: 5
|
| 493 |
+
galore_rank:
|
| 494 |
+
value: 128
|
| 495 |
+
galore_scale:
|
| 496 |
+
value: 1
|
| 497 |
+
galore_target_modules:
|
| 498 |
+
value: null
|
| 499 |
+
galore_update_proj_gap:
|
| 500 |
+
value: 50
|
| 501 |
+
galore_with_embedding:
|
| 502 |
+
value: false
|
| 503 |
+
generation_batch_size:
|
| 504 |
+
value: 48
|
| 505 |
+
generation_kwargs:
|
| 506 |
+
value: null
|
| 507 |
+
gradient_accumulation_steps:
|
| 508 |
+
value: 12
|
| 509 |
+
gradient_checkpointing:
|
| 510 |
+
value: false
|
| 511 |
+
gradient_checkpointing_kwargs:
|
| 512 |
+
value: null
|
| 513 |
+
greater_is_better:
|
| 514 |
+
value: false
|
| 515 |
+
group_by_length:
|
| 516 |
+
value: false
|
| 517 |
+
half_precision_backend:
|
| 518 |
+
value: auto
|
| 519 |
+
hub_always_push:
|
| 520 |
+
value: false
|
| 521 |
+
hub_model_id:
|
| 522 |
+
value: null
|
| 523 |
+
hub_private_repo:
|
| 524 |
+
value: null
|
| 525 |
+
hub_revision:
|
| 526 |
+
value: null
|
| 527 |
+
hub_strategy:
|
| 528 |
+
value: every_save
|
| 529 |
+
hub_token:
|
| 530 |
+
value: <HUB_TOKEN>
|
| 531 |
+
id2label:
|
| 532 |
+
value:
|
| 533 |
+
"0": LABEL_0
|
| 534 |
+
"1": LABEL_1
|
| 535 |
+
ignore_data_skip:
|
| 536 |
+
value: false
|
| 537 |
+
importance_sampling_level:
|
| 538 |
+
value: token
|
| 539 |
+
include_for_metrics:
|
| 540 |
+
value: []
|
| 541 |
+
include_inputs_for_metrics:
|
| 542 |
+
value: false
|
| 543 |
+
include_num_input_tokens_seen:
|
| 544 |
+
value: "no"
|
| 545 |
+
include_tokens_per_second:
|
| 546 |
+
value: false
|
| 547 |
+
is_decoder:
|
| 548 |
+
value: false
|
| 549 |
+
is_encoder_decoder:
|
| 550 |
+
value: false
|
| 551 |
+
jit_mode_eval:
|
| 552 |
+
value: false
|
| 553 |
+
kl_in_reward:
|
| 554 |
+
value: false
|
| 555 |
+
label_names:
|
| 556 |
+
value: null
|
| 557 |
+
label_smoothing_factor:
|
| 558 |
+
value: 0
|
| 559 |
+
label2id:
|
| 560 |
+
value:
|
| 561 |
+
LABEL_0: 0
|
| 562 |
+
LABEL_1: 1
|
| 563 |
+
learning_rate:
|
| 564 |
+
value: 5e-05
|
| 565 |
+
length_column_name:
|
| 566 |
+
value: length
|
| 567 |
+
length_penalty:
|
| 568 |
+
value: 1
|
| 569 |
+
liger_kernel_config:
|
| 570 |
+
value: null
|
| 571 |
+
lisa_activated_layers:
|
| 572 |
+
value: 0
|
| 573 |
+
lisa_step_interval:
|
| 574 |
+
value: 20
|
| 575 |
+
load_best_model_at_end:
|
| 576 |
+
value: false
|
| 577 |
+
local_rank:
|
| 578 |
+
value: 0
|
| 579 |
+
log_completions:
|
| 580 |
+
value: true
|
| 581 |
+
log_completions_hub_repo:
|
| 582 |
+
value: null
|
| 583 |
+
log_entropy:
|
| 584 |
+
value: false
|
| 585 |
+
log_level:
|
| 586 |
+
value: passive
|
| 587 |
+
log_level_replica:
|
| 588 |
+
value: warning
|
| 589 |
+
log_on_each_node:
|
| 590 |
+
value: true
|
| 591 |
+
log_rollout_offpolicy_metrics:
|
| 592 |
+
value: false
|
| 593 |
+
log_unique_prompts:
|
| 594 |
+
value: false
|
| 595 |
+
logging_dir:
|
| 596 |
+
value: /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/out/qwen3asr_dapo_reward56_4x4x12_12gen_4GPU/v4-20260417-125332/runs
|
| 597 |
+
logging_first_step:
|
| 598 |
+
value: true
|
| 599 |
+
logging_nan_inf_filter:
|
| 600 |
+
value: true
|
| 601 |
+
logging_steps:
|
| 602 |
+
value: 5
|
| 603 |
+
logging_strategy:
|
| 604 |
+
value: steps
|
| 605 |
+
lora_rank:
|
| 606 |
+
value: 8
|
| 607 |
+
loss_type:
|
| 608 |
+
value: dapo
|
| 609 |
+
lr_scheduler_kwargs:
|
| 610 |
+
value: null
|
| 611 |
+
lr_scheduler_type:
|
| 612 |
+
value: cosine
|
| 613 |
+
mask_truncated_completions:
|
| 614 |
+
value: false
|
| 615 |
+
max_completion_length:
|
| 616 |
+
value: 256
|
| 617 |
+
max_epochs:
|
| 618 |
+
value: null
|
| 619 |
+
max_grad_norm:
|
| 620 |
+
value: 1
|
| 621 |
+
max_length:
|
| 622 |
+
value: 20
|
| 623 |
+
max_resample_times:
|
| 624 |
+
value: 4
|
| 625 |
+
max_shard_size:
|
| 626 |
+
value: 5GB
|
| 627 |
+
max_steps:
|
| 628 |
+
value: -1
|
| 629 |
+
max_tool_calling_iterations:
|
| 630 |
+
value: null
|
| 631 |
+
max_turns:
|
| 632 |
+
value: null
|
| 633 |
+
metric_for_best_model:
|
| 634 |
+
value: loss
|
| 635 |
+
min_length:
|
| 636 |
+
value: 0
|
| 637 |
+
min_p:
|
| 638 |
+
value: null
|
| 639 |
+
model/num_parameters:
|
| 640 |
+
value: 2050307712
|
| 641 |
+
model_init_kwargs:
|
| 642 |
+
value: null
|
| 643 |
+
model_type:
|
| 644 |
+
value: qwen3_asr
|
| 645 |
+
move_model_batches:
|
| 646 |
+
value: null
|
| 647 |
+
mp_parameters:
|
| 648 |
+
value: ""
|
| 649 |
+
multi_objective_aggregation:
|
| 650 |
+
value: sum_then_normalize
|
| 651 |
+
multi_turn_scheduler:
|
| 652 |
+
value: null
|
| 653 |
+
neftune_noise_alpha:
|
| 654 |
+
value: null
|
| 655 |
+
no_cuda:
|
| 656 |
+
value: false
|
| 657 |
+
no_repeat_ngram_size:
|
| 658 |
+
value: 0
|
| 659 |
+
num_beam_groups:
|
| 660 |
+
value: 1
|
| 661 |
+
num_beams:
|
| 662 |
+
value: 1
|
| 663 |
+
num_completions_to_print:
|
| 664 |
+
value: null
|
| 665 |
+
num_generations:
|
| 666 |
+
value: 12
|
| 667 |
+
num_generations_eval:
|
| 668 |
+
value: 4
|
| 669 |
+
num_iterations:
|
| 670 |
+
value: 2
|
| 671 |
+
num_return_sequences:
|
| 672 |
+
value: 1
|
| 673 |
+
num_train_epochs:
|
| 674 |
+
value: 3
|
| 675 |
+
off_policy_mask_threshold:
|
| 676 |
+
value: null
|
| 677 |
+
off_policy_sequence_mask_delta:
|
| 678 |
+
value: null
|
| 679 |
+
offload_model:
|
| 680 |
+
value: false
|
| 681 |
+
offload_optimizer:
|
| 682 |
+
value: false
|
| 683 |
+
optim:
|
| 684 |
+
value: adamw_torch
|
| 685 |
+
optim_args:
|
| 686 |
+
value: null
|
| 687 |
+
optim_target_modules:
|
| 688 |
+
value: null
|
| 689 |
+
optimizer:
|
| 690 |
+
value: null
|
| 691 |
+
output_attentions:
|
| 692 |
+
value: false
|
| 693 |
+
output_dir:
|
| 694 |
+
value: /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/out/qwen3asr_dapo_reward56_4x4x12_12gen_4GPU/v4-20260417-125332
|
| 695 |
+
output_hidden_states:
|
| 696 |
+
value: false
|
| 697 |
+
output_scores:
|
| 698 |
+
value: false
|
| 699 |
+
overlong_filter:
|
| 700 |
+
value: true
|
| 701 |
+
overwrite_output_dir:
|
| 702 |
+
value: false
|
| 703 |
+
pad_token_id:
|
| 704 |
+
value: 151643
|
| 705 |
+
parallelism_config:
|
| 706 |
+
value: null
|
| 707 |
+
past_index:
|
| 708 |
+
value: -1
|
| 709 |
+
peft_config:
|
| 710 |
+
value:
|
| 711 |
+
default:
|
| 712 |
+
alora_invocation_tokens: null
|
| 713 |
+
arrow_config: null
|
| 714 |
+
auto_mapping: null
|
| 715 |
+
base_model_name_or_path: /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/qwen3-asr-merged
|
| 716 |
+
bias: none
|
| 717 |
+
corda_config: null
|
| 718 |
+
ensure_weight_tying: false
|
| 719 |
+
eva_config: null
|
| 720 |
+
exclude_modules: null
|
| 721 |
+
fan_in_fan_out: false
|
| 722 |
+
inference_mode: false
|
| 723 |
+
init_lora_weights: true
|
| 724 |
+
layer_replication: null
|
| 725 |
+
layers_pattern: null
|
| 726 |
+
layers_to_transform: null
|
| 727 |
+
lora_alpha: 32
|
| 728 |
+
lora_bias: false
|
| 729 |
+
lora_dropout: 0.05
|
| 730 |
+
lora_dtype: null
|
| 731 |
+
lorap_emb_lr: 1e-06
|
| 732 |
+
lorap_lr_ratio: null
|
| 733 |
+
megatron_config: null
|
| 734 |
+
megatron_core: megatron.core
|
| 735 |
+
modules_to_save: []
|
| 736 |
+
peft_type: LORA
|
| 737 |
+
peft_version: 0.18.1
|
| 738 |
+
qalora_group_size: 16
|
| 739 |
+
r: 8
|
| 740 |
+
revision: null
|
| 741 |
+
runtime_config:
|
| 742 |
+
ephemeral_gpu_offload: false
|
| 743 |
+
target_modules: ^(thinker\.model(?=\.).*\.(k_proj|q_proj|down_proj|up_proj|v_proj|gate_proj|o_proj)|thinker\.audio_tower\.layers(?=\.).*\.(k_proj|fc1|fc2|q_proj|out_proj|v_proj)|thinker\.audio_tower\.conv_out(?=\.)|thinker\.audio_tower\.proj1(?=\.)|thinker\.audio_tower\.proj2(?=\.))$
|
| 744 |
+
target_parameters: null
|
| 745 |
+
task_type: CAUSAL_LM
|
| 746 |
+
trainable_token_indices: null
|
| 747 |
+
use_dora: false
|
| 748 |
+
use_qalora: false
|
| 749 |
+
use_rslora: false
|
| 750 |
+
per_device_eval_batch_size:
|
| 751 |
+
value: 4
|
| 752 |
+
per_device_train_batch_size:
|
| 753 |
+
value: 4
|
| 754 |
+
per_gpu_eval_batch_size:
|
| 755 |
+
value: null
|
| 756 |
+
per_gpu_train_batch_size:
|
| 757 |
+
value: null
|
| 758 |
+
prediction_loss_only:
|
| 759 |
+
value: false
|
| 760 |
+
prefix:
|
| 761 |
+
value: null
|
| 762 |
+
problem_type:
|
| 763 |
+
value: null
|
| 764 |
+
project:
|
| 765 |
+
value: huggingface
|
| 766 |
+
push_to_hub:
|
| 767 |
+
value: false
|
| 768 |
+
push_to_hub_model_id:
|
| 769 |
+
value: null
|
| 770 |
+
push_to_hub_organization:
|
| 771 |
+
value: null
|
| 772 |
+
push_to_hub_token:
|
| 773 |
+
value: <PUSH_TO_HUB_TOKEN>
|
| 774 |
+
ray_scope:
|
| 775 |
+
value: last
|
| 776 |
+
ref_model_mixup_alpha:
|
| 777 |
+
value: 0.6
|
| 778 |
+
ref_model_sync_steps:
|
| 779 |
+
value: 512
|
| 780 |
+
remove_invalid_values:
|
| 781 |
+
value: false
|
| 782 |
+
remove_unused_columns:
|
| 783 |
+
value: false
|
| 784 |
+
repetition_max_penalty:
|
| 785 |
+
value: -1
|
| 786 |
+
repetition_n_grams:
|
| 787 |
+
value: 3
|
| 788 |
+
repetition_penalty:
|
| 789 |
+
value: 1.08
|
| 790 |
+
report_to:
|
| 791 |
+
value:
|
| 792 |
+
- wandb
|
| 793 |
+
restore_callback_states_from_checkpoint:
|
| 794 |
+
value: false
|
| 795 |
+
resume_from_checkpoint:
|
| 796 |
+
value: null
|
| 797 |
+
resume_only_model:
|
| 798 |
+
value: false
|
| 799 |
+
return_dict:
|
| 800 |
+
value: true
|
| 801 |
+
return_dict_in_generate:
|
| 802 |
+
value: false
|
| 803 |
+
reward_model:
|
| 804 |
+
value: null
|
| 805 |
+
reward_model_plugin:
|
| 806 |
+
value: null
|
| 807 |
+
reward_weights:
|
| 808 |
+
value: null
|
| 809 |
+
rollout_importance_sampling_mode:
|
| 810 |
+
value: null
|
| 811 |
+
rollout_importance_sampling_threshold:
|
| 812 |
+
value: 2
|
| 813 |
+
router_aux_loss_coef:
|
| 814 |
+
value: 0
|
| 815 |
+
run_name:
|
| 816 |
+
value: qwen3asr_dapo_reward56_4x4x12_12gen_4GPU
|
| 817 |
+
safe_serialization:
|
| 818 |
+
value: true
|
| 819 |
+
sapo_temperature_neg:
|
| 820 |
+
value: 1.05
|
| 821 |
+
sapo_temperature_pos:
|
| 822 |
+
value: 1
|
| 823 |
+
save_on_each_node:
|
| 824 |
+
value: false
|
| 825 |
+
save_only_model:
|
| 826 |
+
value: false
|
| 827 |
+
save_safetensors:
|
| 828 |
+
value: true
|
| 829 |
+
save_steps:
|
| 830 |
+
value: 20
|
| 831 |
+
save_strategy:
|
| 832 |
+
value: steps
|
| 833 |
+
save_total_limit:
|
| 834 |
+
value: null
|
| 835 |
+
scale_rewards:
|
| 836 |
+
value: group
|
| 837 |
+
seed:
|
| 838 |
+
value: 42
|
| 839 |
+
sep_token_id:
|
| 840 |
+
value: null
|
| 841 |
+
shuffle_dataset:
|
| 842 |
+
value: true
|
| 843 |
+
skip_memory_metrics:
|
| 844 |
+
value: true
|
| 845 |
+
sleep_level:
|
| 846 |
+
value: 0
|
| 847 |
+
soft_cache_length:
|
| 848 |
+
value: null
|
| 849 |
+
soft_max_length:
|
| 850 |
+
value: null
|
| 851 |
+
steps_per_generation:
|
| 852 |
+
value: 3
|
| 853 |
+
stop_words:
|
| 854 |
+
value: []
|
| 855 |
+
structured_outputs_regex:
|
| 856 |
+
value: null
|
| 857 |
+
support_languages:
|
| 858 |
+
value:
|
| 859 |
+
- Chinese
|
| 860 |
+
- English
|
| 861 |
+
- Cantonese
|
| 862 |
+
- Arabic
|
| 863 |
+
- German
|
| 864 |
+
- French
|
| 865 |
+
- Spanish
|
| 866 |
+
- Portuguese
|
| 867 |
+
- Indonesian
|
| 868 |
+
- Italian
|
| 869 |
+
- Korean
|
| 870 |
+
- Russian
|
| 871 |
+
- Thai
|
| 872 |
+
- Vietnamese
|
| 873 |
+
- Japanese
|
| 874 |
+
- Turkish
|
| 875 |
+
- Hindi
|
| 876 |
+
- Malay
|
| 877 |
+
- Dutch
|
| 878 |
+
- Swedish
|
| 879 |
+
- Danish
|
| 880 |
+
- Finnish
|
| 881 |
+
- Polish
|
| 882 |
+
- Czech
|
| 883 |
+
- Filipino
|
| 884 |
+
- Persian
|
| 885 |
+
- Greek
|
| 886 |
+
- Romanian
|
| 887 |
+
- Hungarian
|
| 888 |
+
- Macedonian
|
| 889 |
+
suppress_tokens:
|
| 890 |
+
value: null
|
| 891 |
+
sync_ref_model:
|
| 892 |
+
value: false
|
| 893 |
+
task_specific_params:
|
| 894 |
+
value: null
|
| 895 |
+
tau_neg:
|
| 896 |
+
value: 1.05
|
| 897 |
+
tau_pos:
|
| 898 |
+
value: 1
|
| 899 |
+
temperature:
|
| 900 |
+
value: 0.5
|
| 901 |
+
tf_legacy_loss:
|
| 902 |
+
value: false
|
| 903 |
+
tf32:
|
| 904 |
+
value: null
|
| 905 |
+
thinker_config:
|
| 906 |
+
value:
|
| 907 |
+
_name_or_path: ""
|
| 908 |
+
add_cross_attention: false
|
| 909 |
+
architectures:
|
| 910 |
+
- Qwen3ASRForConditionalGeneration
|
| 911 |
+
audio_config:
|
| 912 |
+
_name_or_path: ""
|
| 913 |
+
activation_dropout: 0
|
| 914 |
+
activation_function: gelu
|
| 915 |
+
add_cross_attention: false
|
| 916 |
+
architectures: null
|
| 917 |
+
attention_dropout: 0
|
| 918 |
+
bad_words_ids: null
|
| 919 |
+
begin_suppress_tokens: null
|
| 920 |
+
bos_token_id: null
|
| 921 |
+
chunk_size_feed_forward: 0
|
| 922 |
+
conv_chunksize: 500
|
| 923 |
+
cross_attention_hidden_size: null
|
| 924 |
+
d_model: 1024
|
| 925 |
+
decoder_start_token_id: null
|
| 926 |
+
diversity_penalty: 0
|
| 927 |
+
do_sample: false
|
| 928 |
+
downsample_hidden_size: 480
|
| 929 |
+
dropout: 0
|
| 930 |
+
dtype: null
|
| 931 |
+
early_stopping: false
|
| 932 |
+
encoder_attention_heads: 16
|
| 933 |
+
encoder_ffn_dim: 4096
|
| 934 |
+
encoder_layers: 24
|
| 935 |
+
encoder_no_repeat_ngram_size: 0
|
| 936 |
+
eos_token_id: null
|
| 937 |
+
exponential_decay_length_penalty: null
|
| 938 |
+
finetuning_task: null
|
| 939 |
+
forced_bos_token_id: null
|
| 940 |
+
forced_eos_token_id: null
|
| 941 |
+
id2label:
|
| 942 |
+
"0": LABEL_0
|
| 943 |
+
"1": LABEL_1
|
| 944 |
+
initializer_range: 0.02
|
| 945 |
+
is_decoder: false
|
| 946 |
+
is_encoder_decoder: false
|
| 947 |
+
label2id:
|
| 948 |
+
LABEL_0: 0
|
| 949 |
+
LABEL_1: 1
|
| 950 |
+
length_penalty: 1
|
| 951 |
+
max_length: 20
|
| 952 |
+
max_source_positions: 1500
|
| 953 |
+
min_length: 0
|
| 954 |
+
model_type: qwen3_asr_audio_encoder
|
| 955 |
+
n_window: 50
|
| 956 |
+
n_window_infer: 800
|
| 957 |
+
no_repeat_ngram_size: 0
|
| 958 |
+
num_beam_groups: 1
|
| 959 |
+
num_beams: 1
|
| 960 |
+
num_hidden_layers: 24
|
| 961 |
+
num_mel_bins: 128
|
| 962 |
+
num_return_sequences: 1
|
| 963 |
+
output_attentions: false
|
| 964 |
+
output_dim: 2048
|
| 965 |
+
output_hidden_states: false
|
| 966 |
+
output_scores: false
|
| 967 |
+
pad_token_id: null
|
| 968 |
+
prefix: null
|
| 969 |
+
problem_type: null
|
| 970 |
+
remove_invalid_values: false
|
| 971 |
+
repetition_penalty: 1
|
| 972 |
+
return_dict: true
|
| 973 |
+
return_dict_in_generate: false
|
| 974 |
+
scale_embedding: false
|
| 975 |
+
sep_token_id: null
|
| 976 |
+
suppress_tokens: null
|
| 977 |
+
task_specific_params: null
|
| 978 |
+
temperature: 1
|
| 979 |
+
tf_legacy_loss: false
|
| 980 |
+
tie_encoder_decoder: false
|
| 981 |
+
tie_word_embeddings: true
|
| 982 |
+
tokenizer_class: null
|
| 983 |
+
top_k: 50
|
| 984 |
+
top_p: 1
|
| 985 |
+
torchscript: false
|
| 986 |
+
typical_p: 1
|
| 987 |
+
use_bfloat16: false
|
| 988 |
+
audio_end_token_id: 151670
|
| 989 |
+
audio_start_token_id: 151669
|
| 990 |
+
audio_token_id: 151676
|
| 991 |
+
bad_words_ids: null
|
| 992 |
+
begin_suppress_tokens: null
|
| 993 |
+
bos_token_id: null
|
| 994 |
+
chunk_size_feed_forward: 0
|
| 995 |
+
cross_attention_hidden_size: null
|
| 996 |
+
decoder_start_token_id: null
|
| 997 |
+
diversity_penalty: 0
|
| 998 |
+
do_sample: false
|
| 999 |
+
dtype: bfloat16
|
| 1000 |
+
early_stopping: false
|
| 1001 |
+
encoder_no_repeat_ngram_size: 0
|
| 1002 |
+
eos_token_id: null
|
| 1003 |
+
exponential_decay_length_penalty: null
|
| 1004 |
+
finetuning_task: null
|
| 1005 |
+
forced_bos_token_id: null
|
| 1006 |
+
forced_eos_token_id: null
|
| 1007 |
+
id2label:
|
| 1008 |
+
"0": LABEL_0
|
| 1009 |
+
"1": LABEL_1
|
| 1010 |
+
initializer_range: 0.02
|
| 1011 |
+
is_decoder: false
|
| 1012 |
+
is_encoder_decoder: false
|
| 1013 |
+
label2id:
|
| 1014 |
+
LABEL_0: 0
|
| 1015 |
+
LABEL_1: 1
|
| 1016 |
+
length_penalty: 1
|
| 1017 |
+
max_length: 20
|
| 1018 |
+
min_length: 0
|
| 1019 |
+
model_type: qwen3_asr_thinker
|
| 1020 |
+
no_repeat_ngram_size: 0
|
| 1021 |
+
num_beam_groups: 1
|
| 1022 |
+
num_beams: 1
|
| 1023 |
+
num_return_sequences: 1
|
| 1024 |
+
output_attentions: false
|
| 1025 |
+
output_hidden_states: false
|
| 1026 |
+
output_scores: false
|
| 1027 |
+
pad_token_id: null
|
| 1028 |
+
prefix: null
|
| 1029 |
+
problem_type: null
|
| 1030 |
+
remove_invalid_values: false
|
| 1031 |
+
repetition_penalty: 1
|
| 1032 |
+
return_dict: true
|
| 1033 |
+
return_dict_in_generate: false
|
| 1034 |
+
sep_token_id: null
|
| 1035 |
+
suppress_tokens: null
|
| 1036 |
+
task_specific_params: null
|
| 1037 |
+
temperature: 1
|
| 1038 |
+
text_config:
|
| 1039 |
+
_name_or_path: ""
|
| 1040 |
+
add_cross_attention: false
|
| 1041 |
+
architectures: null
|
| 1042 |
+
attention_bias: false
|
| 1043 |
+
attention_dropout: 0
|
| 1044 |
+
bad_words_ids: null
|
| 1045 |
+
begin_suppress_tokens: null
|
| 1046 |
+
bos_token_id: null
|
| 1047 |
+
chunk_size_feed_forward: 0
|
| 1048 |
+
cross_attention_hidden_size: null
|
| 1049 |
+
decoder_start_token_id: null
|
| 1050 |
+
diversity_penalty: 0
|
| 1051 |
+
do_sample: false
|
| 1052 |
+
dtype: null
|
| 1053 |
+
early_stopping: false
|
| 1054 |
+
encoder_no_repeat_ngram_size: 0
|
| 1055 |
+
eos_token_id: null
|
| 1056 |
+
exponential_decay_length_penalty: null
|
| 1057 |
+
finetuning_task: null
|
| 1058 |
+
forced_bos_token_id: null
|
| 1059 |
+
forced_eos_token_id: null
|
| 1060 |
+
head_dim: 128
|
| 1061 |
+
hidden_act: silu
|
| 1062 |
+
hidden_size: 2048
|
| 1063 |
+
id2label:
|
| 1064 |
+
"0": LABEL_0
|
| 1065 |
+
"1": LABEL_1
|
| 1066 |
+
initializer_range: 0.02
|
| 1067 |
+
intermediate_size: 6144
|
| 1068 |
+
is_decoder: false
|
| 1069 |
+
is_encoder_decoder: false
|
| 1070 |
+
label2id:
|
| 1071 |
+
LABEL_0: 0
|
| 1072 |
+
LABEL_1: 1
|
| 1073 |
+
length_penalty: 1
|
| 1074 |
+
max_length: 20
|
| 1075 |
+
max_position_embeddings: 65536
|
| 1076 |
+
min_length: 0
|
| 1077 |
+
model_type: qwen3_asr_text
|
| 1078 |
+
no_repeat_ngram_size: 0
|
| 1079 |
+
num_attention_heads: 16
|
| 1080 |
+
num_beam_groups: 1
|
| 1081 |
+
num_beams: 1
|
| 1082 |
+
num_hidden_layers: 28
|
| 1083 |
+
num_key_value_heads: 8
|
| 1084 |
+
num_return_sequences: 1
|
| 1085 |
+
output_attentions: false
|
| 1086 |
+
output_hidden_states: false
|
| 1087 |
+
output_scores: false
|
| 1088 |
+
pad_token_id: 151643
|
| 1089 |
+
prefix: null
|
| 1090 |
+
problem_type: null
|
| 1091 |
+
remove_invalid_values: false
|
| 1092 |
+
repetition_penalty: 1
|
| 1093 |
+
return_dict: true
|
| 1094 |
+
return_dict_in_generate: false
|
| 1095 |
+
rms_norm_eps: 1e-06
|
| 1096 |
+
rope_scaling:
|
| 1097 |
+
interleaved: true
|
| 1098 |
+
mrope_interleaved: true
|
| 1099 |
+
mrope_section:
|
| 1100 |
+
- 24
|
| 1101 |
+
- 20
|
| 1102 |
+
- 20
|
| 1103 |
+
rope_type: default
|
| 1104 |
+
type: default
|
| 1105 |
+
rope_theta: 1000000
|
| 1106 |
+
sep_token_id: null
|
| 1107 |
+
suppress_tokens: null
|
| 1108 |
+
task_specific_params: null
|
| 1109 |
+
temperature: 1
|
| 1110 |
+
tf_legacy_loss: false
|
| 1111 |
+
tie_encoder_decoder: false
|
| 1112 |
+
tie_word_embeddings: true
|
| 1113 |
+
tokenizer_class: null
|
| 1114 |
+
top_k: 50
|
| 1115 |
+
top_p: 1
|
| 1116 |
+
torchscript: false
|
| 1117 |
+
typical_p: 1
|
| 1118 |
+
use_bfloat16: false
|
| 1119 |
+
use_cache: false
|
| 1120 |
+
vocab_size: 151936
|
| 1121 |
+
tf_legacy_loss: false
|
| 1122 |
+
tie_encoder_decoder: false
|
| 1123 |
+
tie_word_embeddings: true
|
| 1124 |
+
tokenizer_class: null
|
| 1125 |
+
top_k: 50
|
| 1126 |
+
top_p: 1
|
| 1127 |
+
torchscript: false
|
| 1128 |
+
typical_p: 1
|
| 1129 |
+
use_bfloat16: false
|
| 1130 |
+
user_token_id: 872
|
| 1131 |
+
tie_encoder_decoder:
|
| 1132 |
+
value: false
|
| 1133 |
+
tie_word_embeddings:
|
| 1134 |
+
value: true
|
| 1135 |
+
tokenizer_class:
|
| 1136 |
+
value: null
|
| 1137 |
+
top_entropy_quantile:
|
| 1138 |
+
value: 1
|
| 1139 |
+
top_k:
|
| 1140 |
+
value: 50
|
| 1141 |
+
top_p:
|
| 1142 |
+
value: 0.95
|
| 1143 |
+
torch_compile:
|
| 1144 |
+
value: false
|
| 1145 |
+
torch_compile_backend:
|
| 1146 |
+
value: null
|
| 1147 |
+
torch_compile_mode:
|
| 1148 |
+
value: null
|
| 1149 |
+
torch_empty_cache_steps:
|
| 1150 |
+
value: null
|
| 1151 |
+
torchdynamo:
|
| 1152 |
+
value: null
|
| 1153 |
+
torchscript:
|
| 1154 |
+
value: false
|
| 1155 |
+
tpu_metrics_debug:
|
| 1156 |
+
value: false
|
| 1157 |
+
tpu_num_cores:
|
| 1158 |
+
value: null
|
| 1159 |
+
trackio_space_id:
|
| 1160 |
+
value: trackio
|
| 1161 |
+
train_dataloader_shuffle:
|
| 1162 |
+
value: true
|
| 1163 |
+
transformers_version:
|
| 1164 |
+
value: 4.57.6
|
| 1165 |
+
tuner_backend:
|
| 1166 |
+
value: peft
|
| 1167 |
+
tuner_type:
|
| 1168 |
+
value: lora
|
| 1169 |
+
typical_p:
|
| 1170 |
+
value: 1
|
| 1171 |
+
use_bfloat16:
|
| 1172 |
+
value: false
|
| 1173 |
+
use_bias_correction_kl:
|
| 1174 |
+
value: false
|
| 1175 |
+
use_cpu:
|
| 1176 |
+
value: false
|
| 1177 |
+
use_flash_ckpt:
|
| 1178 |
+
value: false
|
| 1179 |
+
use_galore:
|
| 1180 |
+
value: false
|
| 1181 |
+
use_legacy_prediction_loop:
|
| 1182 |
+
value: false
|
| 1183 |
+
use_liger_kernel:
|
| 1184 |
+
value: false
|
| 1185 |
+
use_logits_to_keep:
|
| 1186 |
+
value: null
|
| 1187 |
+
use_mps_device:
|
| 1188 |
+
value: false
|
| 1189 |
+
use_transformers_paged:
|
| 1190 |
+
value: false
|
| 1191 |
+
use_vllm:
|
| 1192 |
+
value: false
|
| 1193 |
+
vit_gradient_checkpointing:
|
| 1194 |
+
value: true
|
| 1195 |
+
vit_lr:
|
| 1196 |
+
value: null
|
| 1197 |
+
vllm_data_parallel_size:
|
| 1198 |
+
value: 1
|
| 1199 |
+
vllm_disable_cascade_attn:
|
| 1200 |
+
value: false
|
| 1201 |
+
vllm_disable_custom_all_reduce:
|
| 1202 |
+
value: true
|
| 1203 |
+
vllm_enable_expert_parallel:
|
| 1204 |
+
value: false
|
| 1205 |
+
vllm_enable_lora:
|
| 1206 |
+
value: false
|
| 1207 |
+
vllm_enable_prefix_caching:
|
| 1208 |
+
value: true
|
| 1209 |
+
vllm_enable_sleep_mode:
|
| 1210 |
+
value: false
|
| 1211 |
+
vllm_enforce_eager:
|
| 1212 |
+
value: false
|
| 1213 |
+
vllm_gpu_memory_utilization:
|
| 1214 |
+
value: 0.9
|
| 1215 |
+
vllm_group_port:
|
| 1216 |
+
value: 51216
|
| 1217 |
+
vllm_importance_sampling_cap:
|
| 1218 |
+
value: 3
|
| 1219 |
+
vllm_importance_sampling_correction:
|
| 1220 |
+
value: true
|
| 1221 |
+
vllm_importance_sampling_mode:
|
| 1222 |
+
value: sequence_mask
|
| 1223 |
+
vllm_limit_mm_per_prompt:
|
| 1224 |
+
value: null
|
| 1225 |
+
vllm_max_lora_rank:
|
| 1226 |
+
value: 16
|
| 1227 |
+
vllm_max_model_len:
|
| 1228 |
+
value: null
|
| 1229 |
+
vllm_max_model_length:
|
| 1230 |
+
value: null
|
| 1231 |
+
vllm_max_num_seqs:
|
| 1232 |
+
value: null
|
| 1233 |
+
vllm_mm_processor_cache_gb:
|
| 1234 |
+
value: null
|
| 1235 |
+
vllm_mode:
|
| 1236 |
+
value: null
|
| 1237 |
+
vllm_model_impl:
|
| 1238 |
+
value: vllm
|
| 1239 |
+
vllm_pipeline_parallel_size:
|
| 1240 |
+
value: 1
|
| 1241 |
+
vllm_quantization:
|
| 1242 |
+
value: null
|
| 1243 |
+
vllm_reasoning_parser:
|
| 1244 |
+
value: null
|
| 1245 |
+
vllm_server_base_url:
|
| 1246 |
+
value: null
|
| 1247 |
+
vllm_server_group_port:
|
| 1248 |
+
value: null
|
| 1249 |
+
vllm_server_host:
|
| 1250 |
+
value: null
|
| 1251 |
+
vllm_server_pass_dataset:
|
| 1252 |
+
value: false
|
| 1253 |
+
vllm_server_port:
|
| 1254 |
+
value:
|
| 1255 |
+
- 8000
|
| 1256 |
+
vllm_server_timeout:
|
| 1257 |
+
value: 240
|
| 1258 |
+
vllm_speculative_config:
|
| 1259 |
+
value: null
|
| 1260 |
+
vllm_structured_outputs_regex:
|
| 1261 |
+
value: null
|
| 1262 |
+
vllm_tensor_parallel_size:
|
| 1263 |
+
value: 1
|
| 1264 |
+
vllm_use_async_engine:
|
| 1265 |
+
value: null
|
| 1266 |
+
wandb_log_unique_prompts:
|
| 1267 |
+
value: null
|
| 1268 |
+
warmup_ratio:
|
| 1269 |
+
value: 0.03
|
| 1270 |
+
warmup_steps:
|
| 1271 |
+
value: 0
|
| 1272 |
+
weight_decay:
|
| 1273 |
+
value: 0.1
|
wandb/run-20260417_125349-3c0s7mq3/files/media/table/completions_1_1de95d5626025fdbb34e.table.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"columns": ["step", "prompt", "completion", "ASRWerSubLenCmpHalluDirtyV56", "advantages", "solution"], "data": [["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I had stood by him, whatever the others said.<|im_end|>", -0.18555980920791626, -0.256487101316452, "i'd ha stood by him whatever the others said"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I had stood by him, whatever the others said.<|im_end|>", -0.18555980920791626, -0.256487101316452, "i'd ha stood by him whatever the others said"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I had stood by him, whatever the others said.<|im_end|>", -0.18555980920791626, -0.256487101316452, "i'd ha stood by him whatever the others said"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I had stood by him, whatever the others said.<|im_end|>", -0.18555980920791626, -0.256487101316452, "i'd ha stood by him whatever the others said"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I had stood by him, whatever the others said.<|im_end|>", -0.18555980920791626, -0.256487101316452, "i'd ha stood by him whatever the others said"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I had stood by him, whatever the others said.<|im_end|>", -0.18555980920791626, -0.256487101316452, "i'd ha stood by him whatever the others said"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I had stood by him, whatever the others said.<|im_end|>", -0.18555980920791626, -0.256487101316452, "i'd ha stood by him whatever the 
others said"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I had stood by him, whatever the others said.<|im_end|>", -0.18555980920791626, -0.256487101316452, "i'd ha stood by him whatever the others said"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I had stood by him, whatever the others said.<|im_end|>", -0.18555980920791626, -0.256487101316452, "i'd ha stood by him whatever the others said"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I had stood by him, whatever the others said.<|im_end|>", -0.18555980920791626, -0.256487101316452, "i'd ha stood by him whatever the others said"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I has stood by him, whatever the others said.<|im_end|>", -0.18279924988746643, 2.8213913440704346, "i'd ha stood by him whatever the others said"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I had stood by him, whatever the others said.<|im_end|>", -0.18555980920791626, -0.256487101316452, "i'd ha stood by him whatever the others said"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The reverend rectumist passed his hand wearily over his brow a hill with a faint noise of running up stairs somewhere we never touched the beastly box, said he then your competitors did said missus naylor no no said the curate hastily<|im_end|>", -0.2760888338088989, -0.9180124998092651, "The reverend septimus passed his hand wearily over his brow. I feel a little faint, he said, running upstairs so quickly, we never touched the beastly box, said robert. Then your confederates did said miss selina. 
No, no, said the curate hastily."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The reverend recteur passed his hand wearily over his brow a hill with a faint memory of running upstairs so quickly, we never touched the beastly box said he then your competitor is dead said missus nisbet no, no said the curate hastily.<|im_end|>", -0.09747578948736191, 0.25090181827545166, "The reverend septimus passed his hand wearily over his brow. I feel a little faint, he said, running upstairs so quickly, we never touched the beastly box, said robert. Then your confederates did said miss selina. No, no, said the curate hastily."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The reverend recteur passed his hand wearily over his brow a hill with a fainting spell in it upstairs, he said. We never touched the beastly box before and your competitor did, said missus nina no, no, said the curate hastily.<|im_end|>", -0.4100283682346344, -1.7945656776428223, "The reverend septimus passed his hand wearily over his brow. I feel a little faint, he said, running upstairs so quickly, we never touched the beastly box, said robert. Then your confederates did said miss selina. No, no, said the curate hastily."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The reverend rectory passed his hand wearily over his brow. I feel a little faint, Missus Allen, upstairs said vicar. We never touched the beastly box, did we? Then your competitor is dead, said missus allen no no said the curate hastily.<|im_end|>", 0.06087213382124901, 1.2871931791305542, "The reverend septimus passed his hand wearily over his brow. I feel a little faint, he said, running upstairs so quickly, we never touched the beastly box, said robert. Then your confederates did said miss selina. 
No, no, said the curate hastily."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The reverend recteur passed his hand wearily over his brow a hillwood of faintness and running upstairs so quickly we never touched the beastly box said the vicar then your competitor did said missus nelly no, no said the curate hastily<|im_end|>", -0.06288440525531769, 0.47728151082992554, "The reverend septimus passed his hand wearily over his brow. I feel a little faint, he said, running upstairs so quickly, we never touched the beastly box, said robert. Then your confederates did said miss selina. No, no, said the curate hastily."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The reverend recteur passed his hand wearily over his brow a hill of saint nicholas went upstairs so quickly we never touched the beastly box then your competitor did said missus nixon no, no, said the curate hastily.<|im_end|>", 0.01360579114407301, 0.9778635501861572, "The reverend septimus passed his hand wearily over his brow. I feel a little faint, he said, running upstairs so quickly, we never touched the beastly box, said robert. Then your confederates did said miss selina. No, no, said the curate hastily."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The reverend rectumist passed his hand wearily over his brow a still little faintness had been running up stairs since dinner. We never touched the beastly box, said he and your competitor did, said missus anna no, no, said the curate hastily.<|im_end|>", -0.15452256798744202, -0.1224348247051239, "The reverend septimus passed his hand wearily over his brow. I feel a little faint, he said, running upstairs so quickly, we never touched the beastly box, said robert. Then your confederates did said miss selina. 
No, no, said the curate hastily."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The reverend recteur passed his hand wearily over his brow, a hill with a faint memory of running upstairs so quickly. We never touched the beastly box before. Then your competitor did said missus nixon no no said the curate hastily.<|im_end|>", -0.17706401646137238, -0.26995497941970825, "The reverend septimus passed his hand wearily over his brow. I feel a little faint, he said, running upstairs so quickly, we never touched the beastly box, said robert. Then your confederates did said miss selina. No, no, said the curate hastily."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The reverend rectumist passed his hand wearily over his brow a hillwood of faintness and running upstairs so quickly, we never touched the beastly box. Then your competitor did said missus nixon no no said the curate hastily.<|im_end|>", 0.016543198376893997, 0.9970871210098267, "The reverend septimus passed his hand wearily over his brow. I feel a little faint, he said, running upstairs so quickly, we never touched the beastly box, said robert. Then your confederates did said miss selina. No, no, said the curate hastily."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The reverend rectors passed his hand wearily over his brow, a hill with a faint memory of running upstairs so quickly. We never touched the beastly box. Then your competitor did said missus neale no no said the curate hastily.<|im_end|>", -0.1560557782649994, -0.13246876001358032, "The reverend septimus passed his hand wearily over his brow. I feel a little faint, he said, running upstairs so quickly, we never touched the beastly box, said robert. Then your confederates did said miss selina. 
No, no, said the curate hastily."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The reverend recteur passed his hand wearily over his brow a hill with a faint moonlight running upstairs so quickly, we never touched the beastly box said he then you're a competitor, it seems said missus nixon no no said the curate hastily<|im_end|>", -0.36874449253082275, -1.5243877172470093, "The reverend septimus passed his hand wearily over his brow. I feel a little faint, he said, running upstairs so quickly, we never touched the beastly box, said robert. Then your confederates did said miss selina. No, no, said the curate hastily."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The reverend recteur passed his hand wearily over his brow, I feel a little faint now that I am upstairs so quickly. We never touched the vesuvio, said the doctor. Then your competitors did, said missus nina. No, no, said the curate hastily.<|im_end|>", -0.01792760007083416, 0.771496593952179, "The reverend septimus passed his hand wearily over his brow. I feel a little faint, he said, running upstairs so quickly, we never touched the beastly box, said robert. Then your confederates did said miss selina. No, no, said the curate hastily."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>There was much armaghajt in my cousin's sister, the political aspect of the revolution is fenced changing almost every day she might not understand how his own views and sympathies might often modify her.<|im_end|>", -0.025386638939380646, -1.575260877609253, "There was much armand saint just could not tell his sister the political aspect of the revolution in france was changing almost every day. 
She might not understand how his own views and sympathies might become modified."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>There was much armagnac julec in my parent's estate, the political aspect of the revolution since changing almost every day she might not understand how his own views and sympathies might often modify them.<|im_end|>", -0.03027840331196785, -1.6189521551132202, "There was much armand saint just could not tell his sister the political aspect of the revolution in france was changing almost every day. She might not understand how his own views and sympathies might become modified."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>There was much armagnac jokes with my cousins and sister, the political aspect of the revolution in france changing almost every day she might not understand how his own views and sympathies might differ from mine.<|im_end|>", 0.10477012395858765, -0.41274797916412354, "There was much armand saint just could not tell his sister the political aspect of the revolution in france was changing almost every day. She might not understand how his own views and sympathies might become modified."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>There was much armagnac joke for my cousin sister, the political aspect of the revolution in france changing almost every day she might not understand how his own views and sympathies might often modify those.<|im_end|>", 0.11768282204866409, -0.29741644859313965, "There was much armand saint just could not tell his sister the political aspect of the revolution in france was changing almost every day. 
She might not understand how his own views and sympathies might become modified."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>There was much armagnac joke from my cousin sister, the political aspect of the revolution in france changing almost every day she might not understand how his own views and sympathies might be modified.<|im_end|>", 0.2628527879714966, 0.9991887807846069, "There was much armand saint just could not tell his sister the political aspect of the revolution in france was changing almost every day. She might not understand how his own views and sympathies might become modified."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>There was much armageddus in my present system. The political aspect of the revolution is hence changing almost every day. She might not understand how his own views and sympathies might often modify mine.<|im_end|>", 0.05142616108059883, -0.8891968727111816, "There was much armand saint just could not tell his sister the political aspect of the revolution in france was changing almost every day. She might not understand how his own views and sympathies might become modified."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>There was much armagnac, jute and matelot in his tea. The political aspect of the revolution is hence changing almost every day. She might not understand how his own views and sympathies might have been modified.<|im_end|>", 0.18227215111255646, 0.27947190403938293, "There was much armand saint just could not tell his sister the political aspect of the revolution in france was changing almost every day. 
She might not understand how his own views and sympathies might become modified."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>There was much armagnac, jute for my companion sister. The political aspect of the revolution in france changing almost every day. She might not understand how his own views and sympathies might often modify.<|im_end|>", 0.257134348154068, 0.9481137990951538, "There was much armand saint just could not tell his sister the political aspect of the revolution in france was changing almost every day. She might not understand how his own views and sympathies might become modified."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>There was much armagnac yoke to my cousin's sister, the political aspect of the revolution in france changing almost every day she might not understand how his own views and sympathies might differ from mine.<|im_end|>", 0.11708571761846542, -0.3027495741844177, "There was much armand saint just could not tell his sister the political aspect of the revolution in france was changing almost every day. She might not understand how his own views and sympathies might become modified."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>There was much armagnac joke to my cousin's sister, the political aspect of the revolution in france changing almost every day she might not understand how his own views and sympathies might be modified.<|im_end|>", 0.2641826272010803, 1.0110664367675781, "There was much armand saint just could not tell his sister the political aspect of the revolution in france was changing almost every day. 
She might not understand how his own views and sympathies might become modified."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>There was much armagnac joke with my cousins sister, the political aspect of the revolution in france changing almost every day she might not understand how his own views and sympathies might be modified.<|im_end|>", 0.26373809576034546, 1.0070960521697998, "There was much armand saint just could not tell his sister the political aspect of the revolution in france was changing almost every day. She might not understand how his own views and sympathies might become modified."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>There was much armagnac yet for my traveling sister. The political aspect of the revolution in france is changing almost every day. She might not understand how her own views and sympathies might be modified.<|im_end|>", 0.24630455672740936, 0.8513860106468201, "There was much armand saint just could not tell his sister the political aspect of the revolution in france was changing almost every day. 
She might not understand how his own views and sympathies might become modified."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Never, private or public, that the order should be payable in India and to bear an interest of five per cent if these orders were supposed to be vicious by reason of being purchased he secondly with very little hesitation adopted both orders were immediately printed.<|im_end|>", -0.3420386016368866, -0.659913957118988, "and therefore i propos'd that the orders should be payable in a year and to bear an interest of five per cent with these orders i suppos'd the provisions might easily be purchas'd the assembly with very little hesitation adopted the proposal the orders were immediately printed"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Never, rather opposed that the order should be payable in India and do bear an interest of five per cent if these orders were disposed of provisions might easily be purchased he seconded with very little hesitation adopted both orders were immediately printed.<|im_end|>", -0.032027214765548706, 1.195294737815857, "and therefore i propos'd that the orders should be payable in a year and to bear an interest of five per cent with these orders i suppos'd the provisions might easily be purchas'd the assembly with very little hesitation adopted the proposal the orders were immediately printed"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Never, either of both that they ordered it should be payable in a year and do bear an interest of five per cent if these orders were disposed of provisions might easily be purchased he said with very little hesitation adopted by both orders were immediately printed.<|im_end|>", -0.04057157412171364, 1.1441625356674194, "and therefore i propos'd 
that the orders should be payable in a year and to bear an interest of five per cent with these orders i suppos'd the provisions might easily be purchas'd the assembly with very little hesitation adopted the proposal the orders were immediately printed"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Never prior to public opinion that the order should be payable in any and do bearing interest of five per cent if these orders were supposed provisionists might easily be purchased this enactment with very little hesitation adopted by both voters were immediately printed.<|im_end|>", -0.3433881402015686, -0.6679900288581848, "and therefore i propos'd that the orders should be payable in a year and to bear an interest of five per cent with these orders i suppos'd the provisions might easily be purchas'd the assembly with very little hesitation adopted the proposal the orders were immediately printed"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Never, prior to the public that they ordered it should be payable in a year and do bear an interest of five per cent if these orders were disposed of provisionally at least would be purchased he said with very little hesitation adopted both orders were immediately printed.<|im_end|>", -0.33630597591400146, -0.6256080865859985, "and therefore i propos'd that the orders should be payable in a year and to bear an interest of five per cent with these orders i suppos'd the provisions might easily be purchas'd the assembly with very little hesitation adopted the proposal the orders were immediately printed"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Never prior to publication that the order should be payable in any year and do bear an interest of five per cent if these orders were disposed of 
provisionally at least could be purchased he said with very little hesitation adopted both orders were immediately printed<|im_end|>", -0.1676534116268158, 0.3836635649204254, "and therefore i propos'd that the orders should be payable in a year and to bear an interest of five per cent with these orders i suppos'd the provisions might easily be purchas'd the assembly with very little hesitation adopted the proposal the orders were immediately printed"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Never prior to public opinion that they ordered it should be payable in India and do bear an interest of five per cent if these orders were supposed provision is likely soon to be purchased this act with very little hesitation adopted by both voters were immediately printed.<|im_end|>", -0.5411341190338135, -1.8513660430908203, "and therefore i propos'd that the orders should be payable in a year and to bear an interest of five per cent with these orders i suppos'd the provisions might easily be purchas'd the assembly with very little hesitation adopted the proposal the orders were immediately printed"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Never prior to public debate that the order should be payable in England and do bear an interest of five per cent if these orders were to suppose the provisions might easily be purchased he seconded with very little hesitation adopted both orders were immediately printed.<|im_end|>", -0.07721911370754242, 0.9248517155647278, "and therefore i propos'd that the orders should be payable in a year and to bear an interest of five per cent with these orders i suppos'd the provisions might easily be purchas'd the assembly with very little hesitation adopted the proposal the orders were immediately printed"], ["1", 
"<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Never, prior to publication that they ordered it should be payable in a year and do bear an interest of five per cent if these orders were disposed of provisionally at least would be purchased is now with very little hesitation adopted both orders were immediately printed<|im_end|>", -0.22012776136398315, 0.06964004039764404, "and therefore i propos'd that the orders should be payable in a year and to bear an interest of five per cent with these orders i suppos'd the provisions might easily be purchas'd the assembly with very little hesitation adopted the proposal the orders were immediately printed"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Never prior to published that the order should be payable in a year and do bear an interest of five per cent, if these orders were disposed of provisionally at least would be purchased he seconded with very little hesitation adopted both orders were immediately printed<|im_end|>", -0.16621676087379456, 0.39226093888282776, "and therefore i propos'd that the orders should be payable in a year and to bear an interest of five per cent with these orders i suppos'd the provisions might easily be purchas'd the assembly with very little hesitation adopted the proposal the orders were immediately printed"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Never, cried her beloved, that the order should be payable in England and do bear interest at five per cent if these orders were disposed of provisionally at least would they purchase he said with very little hesitation adopted them both the orders were immediately printed.<|im_end|>", -0.4380200207233429, -1.2342978715896606, "and therefore i propos'd that the orders should be payable in a year and to bear an interest 
of five per cent with these orders i suppos'd the provisions might easily be purchas'd the assembly with very little hesitation adopted the proposal the orders were immediately printed"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Never prior to public debate that they ordered it should be payable in a year and to bear an interest of five per cent if these orders were supposed provisionists might easily be purchased he seconded with very little hesitation adopted both orders were immediately printed.<|im_end|>", -0.07647529989480972, 0.9293028712272644, "and therefore i propos'd that the orders should be payable in a year and to bear an interest of five per cent with these orders i suppos'd the provisions might easily be purchas'd the assembly with very little hesitation adopted the proposal the orders were immediately printed"]]}
|
wandb/run-20260417_125349-3c0s7mq3/files/media/table/completions_3_b8120af2e2a4bc038eb5.table.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"columns": ["step", "prompt", "completion", "ASRWerSubLenCmpHalluDirtyV56", "advantages", "solution"], "data": [["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Coordinating and shifting, collectively said he sheu, divided with each other in forming new combinations. We must remember however that the flower worship of the tibetans was formed from only a part of their ascetic ritual and it was not a distinct religion by itself.<|im_end|>", 0.06746125966310501, 0.25112149119377136, "kobori enshiu katagiri sekishiu vied with each other in forming new combinations we must remember however that the flower worship of the tea masters formed only a part of their aesthetic ritual and was not a distinct religion by itself"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Kohori and shi no katanu ni seki shi no vied with each other in forming new combinations. We must remember, however, that the flower worship of the tea masters formed only a part of their ascetic ritual, and it was not a distinct religion by itself.<|im_end|>", 0.008763517253100872, -0.30829519033432007, "kobori enshiu katagiri sekishiu vied with each other in forming new combinations we must remember however that the flower worship of the tea masters formed only a part of their aesthetic ritual and was not a distinct religion by itself"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Coordinating and shifting, collectively setting shift, fighting with each other in forming new combinations. 
We must remember, however, that the flower worship of the teengas performed only a part of their respective ritual, and was not a distinct religion by itself.<|im_end|>", -0.017216404899954796, -0.5558958649635315, "kobori enshiu katagiri sekishiu vied with each other in forming new combinations we must remember however that the flower worship of the tea masters formed only a part of their aesthetic ritual and was not a distinct religion by itself"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Coordinating and shifting, collectively said he she would divide with each other in forming new combinations we must remember however that the flower worship of the tibetans was formed from only a part of their ascetic ritual and it was not a distinct religion by itself<|im_end|>", 0.13382616639137268, 0.8836097717285156, "kobori enshiu katagiri sekishiu vied with each other in forming new combinations we must remember however that the flower worship of the tea masters formed only a part of their aesthetic ritual and was not a distinct religion by itself"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Coordinating shibumi, kafanguiyaseki shibumi, fight with each other in forming new combinations. 
We must remember, however, that the flower worship of the teikos was formed from only a part of their ascetic ritual and it was not a distinct religion by itself.<|im_end|>", 0.12175671756267548, 0.7685823440551758, "kobori enshiu katagiri sekishiu vied with each other in forming new combinations we must remember however that the flower worship of the tea masters formed only a part of their aesthetic ritual and was not a distinct religion by itself"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Coordinating and shifting, collectively city shifted, fighting with each other in forming new combinations. We must remember, however, that the flower worship of the teentots performed only a part of their ascetic ritual, and it was not a distinct religion by itself.<|im_end|>", -0.07603159546852112, -1.1164319515228271, "kobori enshiu katagiri sekishiu vied with each other in forming new combinations we must remember however that the flower worship of the tea masters formed only a part of their aesthetic ritual and was not a distinct religion by itself"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Coordinating shiwoo, collectively said yishii, vied with each other in forming new combinations. 
We must remember however that the flower worship of the teegas was but only a part of their ascetic ritual, and it was not a distinct religion by itself.<|im_end|>", 0.18717117607593536, 1.3920124769210815, "kobori enshiu katagiri sekishiu vied with each other in forming new combinations we must remember however that the flower worship of the tea masters formed only a part of their aesthetic ritual and was not a distinct religion by itself"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Coordinating and shifting, coupling these subunits, varied with each other in forming new combinations. We must remember, however, that the flower worship of the teentas performed only a part of their ascetic ritual, and it was not a distinct religion by itself.<|im_end|>", -0.07198049873113632, -1.0778230428695679, "kobori enshiu katagiri sekishiu vied with each other in forming new combinations we must remember however that the flower worship of the tea masters formed only a part of their aesthetic ritual and was not a distinct religion by itself"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Coordinating and shu, ka te nuisi se ki shu fight with each other in forming new combinations we must remember however that the flower worship of the tinus performed only a part of their ascetic ritual and was not a distinct religion by itself.<|im_end|>", 0.0946241021156311, 0.5099959969520569, "kobori enshiu katagiri sekishiu vied with each other in forming new combinations we must remember however that the flower worship of the tea masters formed only a part of their aesthetic ritual and was not a distinct religion by itself"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Kohori and shiromu kafanuri, sakiishi, vied with each other in forming new combinations. 
We must remember however that the flower worship of the teiyas was but only a part of their ascetic ritual, and it was not a distinct religion by itself.<|im_end|>", 0.193635493516922, 1.453620433807373, "kobori enshiu katagiri sekishiu vied with each other in forming new combinations we must remember however that the flower worship of the tea masters formed only a part of their aesthetic ritual and was not a distinct religion by itself"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Coordinating and shifting, collectively setting shift, fighting with each other in forming new combinations. We must remember, however, that the flower worship of the teentas performed only a part of their ascetic ritual, and it was not a distinct religion by itself.<|im_end|>", -0.0758325457572937, -1.1145349740982056, "kobori enshiu katagiri sekishiu vied with each other in forming new combinations we must remember however that the flower worship of the tea masters formed only a part of their aesthetic ritual and was not a distinct religion by itself"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Cohorti and instituti, capellanus et institutus, fight with each other in forming new combinations. 
We must remember, however, that the flower worship of the tegots was formed from only a part of their ascetic ritual, and it was not a distinct religion by itself.<|im_end|>", -0.07283444702625275, -1.0859616994857788, "kobori enshiu katagiri sekishiu vied with each other in forming new combinations we must remember however that the flower worship of the tea masters formed only a part of their aesthetic ritual and was not a distinct religion by itself"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>With red hot boulders lying about everywhere, d'you think it went off well? Creedle he asked her. The victuals did that I know and the drink did that I set fast in believe upon a sound of barrels good honest drink.<|im_end|>", 0.16612012684345245, -0.016373056918382645, "with red hot bowlders lying about everywhere do you think it went off well creedle he asked the victuals did that i know and the drink did that i steadfastly believe from the holler sound of the barrels good honest drink"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>With red hot boulders lying about everywhere, d'you think it went off well? Creedele he asked me. The victuals did that I know and the drink did that I set fasty believe upon a sound of barrels good honest drink.<|im_end|>", 0.15556275844573975, -0.08780591189861298, "with red hot bowlders lying about everywhere do you think it went off well creedle he asked the victuals did that i know and the drink did that i steadfastly believe from the holler sound of the barrels good honest drink"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>With red hot bolters flying about everywhere, do you think it went off well creedle? 
He asked me the victuals did that I know and the drink did that I set fast to believe upon a sound of barrels good honest strength.<|im_end|>", 0.2218746393918991, 0.36087095737457275, "with red hot bowlders lying about everywhere do you think it went off well creedle he asked the victuals did that i know and the drink did that i steadfastly believe from the holler sound of the barrels good honest drink"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>With red hot boulders lying about everywhere, do you think it went off well? Creedle he asked her. The victuals did that I know and the drink did that I steadfastly believe upon a chance of barrels good honest drink.<|im_end|>", 0.42252233624458313, 1.7184855937957764, "with red hot bowlders lying about everywhere do you think it went off well creedle he asked the victuals did that i know and the drink did that i steadfastly believe from the holler sound of the barrels good honest drink"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>With red hot boulders flying about everywhere, do you think it went off well? Creel he asked. The victuals did that I know and the drink did that I set fasty believe upon a shanty barrels good honest strength.<|im_end|>", 0.07005643844604492, -0.6663554310798645, "with red hot bowlders lying about everywhere do you think it went off well creedle he asked the victuals did that i know and the drink did that i steadfastly believe from the holler sound of the barrels good honest drink"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>With red hot bolters flying about everywhere, do you think it went off well? Creedle he asked her. 
The victuals did that I know and the drink did that I set fast to believe upon a challenge of barrels good honest strength.<|im_end|>", 0.1369437873363495, -0.21378487348556519, "with red hot bowlders lying about everywhere do you think it went off well creedle he asked the victuals did that i know and the drink did that i steadfastly believe from the holler sound of the barrels good honest drink"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>With red hot boulders flying about everywhere, do you think it went off well? Creel he asked the victors did that I know and the drink did that I steadfastly believe upon a sound of barrels good honest drink.<|im_end|>", 0.3446210026741028, 1.1913926601409912, "with red hot bowlders lying about everywhere do you think it went off well creedle he asked the victuals did that i know and the drink did that i steadfastly believe from the holler sound of the barrels good honest drink"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>With red hot boulders flying about everywhere, do you think it went off well? Creedele he asked her, the victuals did that I know and the drink did that I steadfastly believe upon a sound of barrels good honest drink.<|im_end|>", 0.3581290543079376, 1.2827903032302856, "with red hot bowlders lying about everywhere do you think it went off well creedle he asked the victuals did that i know and the drink did that i steadfastly believe from the holler sound of the barrels good honest drink"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>With red hot boulders flying about everywhere, do you think it went off well? Creel he asked. 
The victuals did that I know, and the drink did that I said pass'd me believe upon a trial in barrels good honest drink.<|im_end|>", -0.024973222985863686, -1.309341549873352, "with red hot bowlders lying about everywhere do you think it went off well creedle he asked the victuals did that i know and the drink did that i steadfastly believe from the holler sound of the barrels good honest drink"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>With red hot bolters flying about everywhere, d'you think it went off well? Creel he asked her. The victuals did that I know, and the drink did. That I set fasty believe upon a sound of barrels good honest strength.<|im_end|>", -0.054762814193964005, -1.5109026432037354, "with red hot bowlders lying about everywhere do you think it went off well creedle he asked the victuals did that i know and the drink did that i steadfastly believe from the holler sound of the barrels good honest drink"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>With red hot boulders lying about everywhere, do you think it went off well? Creel he asked her the victuals did that I know and the drink did that I set fast to believe upon a chance of barrels good honest drink.<|im_end|>", 0.1390748769044876, -0.19936557114124298, "with red hot bowlders lying about everywhere do you think it went off well creedle he asked the victuals did that i know and the drink did that i steadfastly believe from the holler sound of the barrels good honest drink"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>With red hot boulders lying about everywhere, d'you think it went off well, creedle? He asked. 
The victuals did that I know and the drink did that I said must be believed upon a sound of barrels good honest drink.<|im_end|>", 0.08731066435575485, -0.5496105551719666, "with red hot bowlders lying about everywhere do you think it went off well creedle he asked the victuals did that i know and the drink did that i steadfastly believe from the holler sound of the barrels good honest drink"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For it is wonderful how many things may be acquired by some means a writer was once employed in which of course he got continual friends and you pick up mary hansen gilding on the colonies of abies, which seems answer to your friend's wants.<|im_end|>", -0.8597428202629089, -1.7000007629394531, "For it is wonderful how soon these are acquired by some horses. The writer was once employed to purchase a horse for a country friend. And he picked a very handsome gelding out of collins's stables, which seemed to answer to his friend's wants."], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For it is wonderful how a name can be acquired by some means the writer was once employed in preaching a course of instruction to friends and repeated very handsome gilding on the columns of statues which seemed to answer to his friend's wants.<|im_end|>", -0.28019994497299194, 0.7384878396987915, "For it is wonderful how soon these are acquired by some horses. The writer was once employed to purchase a horse for a country friend. 
And he picked a very handsome gelding out of collins's stables, which seemed to answer to his friend's wants."], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For it is wonderful how men can be inspired by some things a writer was once employed in preaching a course of lectures to his friends, and he picked up very handsome gelding on the colony's estate which seems answer to the prince's wants.<|im_end|>", -0.4687815308570862, -0.05498935654759407, "For it is wonderful how soon these are acquired by some horses. The writer was once employed to purchase a horse for a country friend. And he picked a very handsome gelding out of collins's stables, which seemed to answer to his friend's wants."], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For it is wonderful how names may be acquired by some means. The writer was once employed in preaching before a group of young friends, and repeated his merry fencing gelping on the colonies of babies which seems answer to the friend's wants.<|im_end|>", -0.6376533508300781, -0.7655355930328369, "For it is wonderful how soon these are acquired by some horses. The writer was once employed to purchase a horse for a country friend. And he picked a very handsome gelding out of collins's stables, which seemed to answer to his friend's wants."], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For it is wonderful how many things may be acquired by some means. The writer was once employed in purchase of horses from his friends, and repeated a very handsome gelding on the colony's table, which seemed to answer to his friend's wants.<|im_end|>", -0.07159067690372467, 1.6162337064743042, "For it is wonderful how soon these are acquired by some horses. 
The writer was once employed to purchase a horse for a country friend. And he picked a very handsome gelding out of collins's stables, which seemed to answer to his friend's wants."], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For it is wonderful how names can be acquired by some means a writer was once employed in teaching a boy about his own friends, and he picked up very handsome gelding on the colony of cape town which seemed to answer just what he wanted.<|im_end|>", -0.39772796630859375, 0.24397611618041992, "For it is wonderful how soon these are acquired by some horses. The writer was once employed to purchase a horse for a country friend. And he picked a very handsome gelding out of collins's stables, which seemed to answer to his friend's wants."], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For it is wonderful how many things are required by some people. The writer was once employed in teaching a course of lectures to his friends, and he picked up very handsome gelding on the colonies of bays which seemed to answer just at his wants.<|im_end|>", -0.31977492570877075, 0.5719718337059021, "For it is wonderful how soon these are acquired by some horses. The writer was once employed to purchase a horse for a country friend. And he picked a very handsome gelding out of collins's stables, which seemed to answer to his friend's wants."], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For it is wonderful how a name can be acquired by some means. 
The writer was once employed in purchase of horses for his friends, and he picked up very handsome geldings on the colonies of scotland, which seems answer to his friend's wants.<|im_end|>", -0.23753882944583893, 0.9179890155792236, "For it is wonderful how soon these are acquired by some horses. The writer was once employed to purchase a horse for a country friend. And he picked a very handsome gelding out of collins's stables, which seemed to answer to his friend's wants."], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For it is wonderful how a name can be acquired by some means. The writer was once employed in preaching before a congregation of friends, and repeated very handsome gilding on the columns of tables, which seemed to answer to his friend's wants.<|im_end|>", -0.33328479528427124, 0.5151276588439941, "For it is wonderful how soon these are acquired by some horses. The writer was once employed to purchase a horse for a country friend. And he picked a very handsome gelding out of collins's stables, which seemed to answer to his friend's wants."], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For it is wonderful how many names are supplied by some mistake. The writer was once employed in teaching a course of instruction to friends, and repeated Mary Hanson gilding on the colonies of babies, which seems answer to his friend's wants.<|im_end|>", -0.3981190025806427, 0.24233078956604004, "For it is wonderful how soon these are acquired by some horses. The writer was once employed to purchase a horse for a country friend. 
And he picked a very handsome gelding out of collins's stables, which seemed to answer to his friend's wants."], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For it is wonderful how many things can be acquired by some means a writer was once employed in which of course he rubbed his teeth with frank and repeated mary hansen gelling on the colonies of georgia, which seems answer to the friend's wants.<|im_end|>", -0.7842603921890259, -1.382400393486023, "For it is wonderful how soon these are acquired by some horses. The writer was once employed to purchase a horse for a country friend. And he picked a very handsome gelding out of collins's stables, which seemed to answer to his friend's wants."], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For it is wonderful how names can be acquired by some mistake. The writer was once employed in teaching a course of natural history at prague, and he pictures mary henshaw gellman on the colony of scotland, which seems answerable to frank's wants.<|im_end|>", -0.6798756718635559, -0.9431905150413513, "For it is wonderful how soon these are acquired by some horses. The writer was once employed to purchase a horse for a country friend. 
And he picked a very handsome gelding out of collins's stables, which seemed to answer to his friend's wants."], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>A week after the battle, my brother replied there from the capital of my expedition to make a horrible discovery that followed the eating up of the bodies of our dead heroes at two doors.<|im_end|>", -0.40796396136283875, -0.19726812839508057, "a week after the battle my brother rode by there on a cavalry expedition and made the horrible discovery that hogs were eating up the bodies of our dead heroes that too was war"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>A week after the battle, my brother was obliged to enter the capital of my expedition to make a horrible supper at the hall meeting of the bodies of our dead heroes. That too was for it.<|im_end|>", -0.6910028457641602, -0.9820257425308228, "a week after the battle my brother rode by there on a cavalry expedition and made the horrible discovery that hogs were eating up the bodies of our dead heroes that too was war"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>A week after the battle, my brother provided her with a capital expedition to make a horrible slaughter at home in eating up the bodies of our dead heroes that too was abortive.<|im_end|>", -0.0851043164730072, 0.6978971362113953, "a week after the battle my brother rode by there on a cavalry expedition and made the horrible discovery that hogs were eating up the bodies of our dead heroes that too was war"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>A week after the battle, my brother replied there from the capital of my expedition, in a horrible and stunned, I called at the meeting of 
the bodies of our dead heroes. That too was a word.<|im_end|>", -0.781724214553833, -1.2335611581802368, "a week after the battle my brother rode by there on a cavalry expedition and made the horrible discovery that hogs were eating up the bodies of our dead heroes that too was war"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>A week after the battle, my brother replied there from a capital in my position with a horrible discovery that he had fallen in eating up the bodies of our dead heroes. That too was a word.<|im_end|>", -0.2709154784679413, 0.18271444737911224, "a week after the battle my brother rode by there on a cavalry expedition and made the horrible discovery that hogs were eating up the bodies of our dead heroes that too was war"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>A week after the battle, my brother rode by there on a cavalry expedition to make a horrible supper at a hall meeting of the bodies of our dead heroes. That too was thwarted.<|im_end|>", 0.09377644956111908, 1.1938644647598267, "a week after the battle my brother rode by there on a cavalry expedition and made the horrible discovery that hogs were eating up the bodies of our dead heroes that too was war"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>A week after the battle, my brother and I were hired by a cavalry expedition to make a horrible study of the fall and eating up of the bodies of our dead heroes. 
That too was worth it.<|im_end|>", -0.39144468307495117, -0.15146653354167938, "a week after the battle my brother rode by there on a cavalry expedition and made the horrible discovery that hogs were eating up the bodies of our dead heroes that too was war"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>A week after the battle, my brother stood by her in a cabin at my expedition and made the horrible discovery that Paul was eating up the body of our dead hero. That too was a word.<|im_end|>", 0.046062320470809937, 1.0615715980529785, "a week after the battle my brother rode by there on a cavalry expedition and made the horrible discovery that hogs were eating up the bodies of our dead heroes that too was war"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>A week after the battle, my brother replied there on the capital of my expedition in a most horrible and shocking manner, that he had been the eating up the body of our dead hero. 
That was true as words.<|im_end|>", -0.8374046683311462, -1.3879414796829224, "a week after the battle my brother rode by there on a cavalry expedition and made the horrible discovery that hogs were eating up the bodies of our dead heroes that too was war"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>A week after the battle, my brother replied there in a capital condition, but made the horrible discovery that all were eating up the bodies of our dead heroes at two this morning.<|im_end|>", 0.09645416587591171, 1.2012887001037598, "a week after the battle my brother rode by there on a cavalry expedition and made the horrible discovery that hogs were eating up the bodies of our dead heroes that too was war"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>A week after the battle, my brother replied there in a capital condition, but in the horrible stumps that followed eating up the bodies of our dead heroes. That too was worth it.<|im_end|>", -0.051983222365379333, 0.7897290587425232, "a week after the battle my brother rode by there on a cavalry expedition and made the horrible discovery that hogs were eating up the bodies of our dead heroes that too was war"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>A week after the battle, my brother replied there from the capital of my expedition, in a most horrible and startling letter that called on me to eat up the bodies of our dead heroes. That too was ordered.<|im_end|>", -0.7605313062667847, -1.1748013496398926, "a week after the battle my brother rode by there on a cavalry expedition and made the horrible discovery that hogs were eating up the bodies of our dead heroes that too was war"]]}
|
wandb/run-20260417_125349-3c0s7mq3/files/media/table/completions_5_510c5f07b145276e4210.table.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"columns": ["step", "prompt", "completion", "ASRWerSubLenCmpHalluDirtyV56", "advantages", "solution"], "data": [["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Instead of listening to you, I tell you that from this day forward, I will give that great man a pension of a thousand pieces of gold per month for his life. Nay, though I were to share with him all my riches and provisions.<|im_end|>", 0.7468931674957275, -0.5118773579597473, "instead of listening to you i tell you that from this day forward i will give that great man a pension of a thousand pieces of gold per month for his life nay though i were to share with him all my riches and dominions"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Instead of listening to you, I tell you that from this day forward, I will give that great man a pension of a thousand pieces of gold per month for his life. Nay, though I were to share with him all my riches and dominions.<|im_end|>", 0.7513310313224792, -0.21503543853759766, "instead of listening to you i tell you that from this day forward i will give that great man a pension of a thousand pieces of gold per month for his life nay though i were to share with him all my riches and dominions"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Instead of listening to you, I tell you that from this day forward, I will give that great man a pension of a thousand pieces of gold per month for his life. 
Nay, though I were to share with him all my riches and dominions.<|im_end|>", 0.7513310313224792, -0.21503543853759766, "instead of listening to you i tell you that from this day forward i will give that great man a pension of a thousand pieces of gold per month for his life nay though i were to share with him all my riches and dominions"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Instead of listening to you, I tell you that from this day forward, I will give that great man a pension of a thousand pieces of gold per month for his life. Nay, though I were to share with him all my riches and dominions.<|im_end|>", 0.7513310313224792, -0.21503543853759766, "instead of listening to you i tell you that from this day forward i will give that great man a pension of a thousand pieces of gold per month for his life nay though i were to share with him all my riches and dominions"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Instead of listening to you, I tell you that from this day forward, I will give that great man a pension of a thousand pieces of gold per month for his life. Nay, though I were to share with him all my riches and dominions.<|im_end|>", 0.7513310313224792, -0.21503543853759766, "instead of listening to you i tell you that from this day forward i will give that great man a pension of a thousand pieces of gold per month for his life nay though i were to share with him all my riches and dominions"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Instead of listening to you, I tell you that from this day forward, I will give that great man a pension of a thousand pieces of gold per month for his life. 
Nay, though I were to share with him all my riches and dominions.<|im_end|>", 0.7513310313224792, -0.21503543853759766, "instead of listening to you i tell you that from this day forward i will give that great man a pension of a thousand pieces of gold per month for his life nay though i were to share with him all my riches and dominions"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Instead of listening to you, I tell you that from this day forward, I will give that great man a pension of a thousand pieces of gold per month for his life. Nay, though I were to share with him all my riches and privileges.<|im_end|>", 0.7445108890533447, -0.6712242960929871, "instead of listening to you i tell you that from this day forward i will give that great man a pension of a thousand pieces of gold per month for his life nay though i were to share with him all my riches and dominions"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Instead of listening to you, I tell you that from this day forward, I will give that great man a pension of a thousand pieces of gold per month for his life nay, though I were to share with him all my riches and dominions.<|im_end|>", 0.8011671900749207, 3.1184284687042236, "instead of listening to you i tell you that from this day forward i will give that great man a pension of a thousand pieces of gold per month for his life nay though i were to share with him all my riches and dominions"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Instead of listening to you, I tell you that from this day forward, I will give that great man a pension of a thousand pieces of gold per month for his life. 
Nay, though I were to share with him all my riches and dominions.<|im_end|>", 0.7513310313224792, -0.21503543853759766, "instead of listening to you i tell you that from this day forward i will give that great man a pension of a thousand pieces of gold per month for his life nay though i were to share with him all my riches and dominions"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Instead of listening to you, I tell you that from this day forward, I will give that great man a pension of a thousand pieces of gold per month for his life. Nay, though I were to share with him all my riches and dominions.<|im_end|>", 0.7513310313224792, -0.21503543853759766, "instead of listening to you i tell you that from this day forward i will give that great man a pension of a thousand pieces of gold per month for his life nay though i were to share with him all my riches and dominions"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Instead of listening to you, I tell you that from this day forward, I will give that great man a pension of a thousand pieces of gold per month for his life. Nay, though I were to share with him all my riches and dominions.<|im_end|>", 0.7513310313224792, -0.21503543853759766, "instead of listening to you i tell you that from this day forward i will give that great man a pension of a thousand pieces of gold per month for his life nay though i were to share with him all my riches and dominions"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Instead of listening to you, I tell you that from this day forward, I will give that great man a pension of a thousand pieces of gold per month for his life. 
Nay, though I were to share with him all my riches and dominions.<|im_end|>", 0.7513310313224792, -0.21503543853759766, "instead of listening to you i tell you that from this day forward i will give that great man a pension of a thousand pieces of gold per month for his life nay though i were to share with him all my riches and dominions"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The baker shook his head, but the crime which I have committed now or has just passed on me of justice and you can only deliver me from it by blessing us secretly as you have just done come up handed said the procurator.<|im_end|>", -0.15717686712741852, -1.0923786163330078, "The beggar shook his head. The crime which I have committed, my lord, has no call upon human justice. And you can only deliver me from it by blessing me frequently, as you have just done. Come be candid, said the coadjutor."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The beggar shook his head. The crime which I have committed, my lord, has no place among you in justice, and you can only deliver me from it by blessing me frequently as you have just done. Come, I command it said the procurator.<|im_end|>", 0.34490713477134705, 0.8904600739479065, "The beggar shook his head. The crime which I have committed, my lord, has no call upon human justice. And you can only deliver me from it by blessing me frequently, as you have just done. 
Come be candid, said the coadjutor."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The baker shook his head, the crime which I have committed now or has been called a thing of justice and you can only deliver me from it by blessing as frequently as you have just done come up hand said the procurator.<|im_end|>", -0.093899667263031, -0.8424832224845886, "The beggar shook his head. The crime which I have committed, my lord, has no call upon human justice. And you can only deliver me from it by blessing me frequently, as you have just done. Come be candid, said the coadjutor."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The baker shook his head, the crime which I have committed my lord has no place in human justice, and you can only deliver me from it by blessing me secretly as you have just done. Come, let's end it said the procurator.<|im_end|>", 0.19140377640724182, 0.2842419743537903, "The beggar shook his head. The crime which I have committed, my lord, has no call upon human justice. And you can only deliver me from it by blessing me frequently, as you have just done. Come be candid, said the coadjutor."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The beggar shook his head, the crime which I have committed now or has been called upon me in justice and you can only deliver me from it by blessing me frequently as you have just done come up hand said the procurator.<|im_end|>", 0.13035276532173157, 0.0431382916867733, "The beggar shook his head. The crime which I have committed, my lord, has no call upon human justice. And you can only deliver me from it by blessing me frequently, as you have just done. 
Come be candid, said the coadjutor."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The baker shook his head. The crime which I have committed, my lord, has no cause of human justice. And you can only deliver me from it by blessing me frequently as you have just done. Come, put hand before the prosecutor.<|im_end|>", 0.4522962272167206, 1.3145629167556763, "The beggar shook his head. The crime which I have committed, my lord, has no call upon human justice. And you can only deliver me from it by blessing me frequently, as you have just done. Come be candid, said the coadjutor."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The baker shook his head, the crime which I have committed now would have no place among you in justice and you can only deliver me from it by blessing me frequently as you have just done come with candids said the procurator.<|im_end|>", -0.018617816269397736, -0.5451788902282715, "The beggar shook his head. The crime which I have committed, my lord, has no call upon human justice. And you can only deliver me from it by blessing me frequently, as you have just done. Come be candid, said the coadjutor."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The baker shook his head, the crime which I have committed now or has already caused me no justice, and you can only deliver me from it by blessing me secretly as you have just done. Come with candids said the prelate judge.<|im_end|>", 0.04945759102702141, -0.276334285736084, "The beggar shook his head. The crime which I have committed, my lord, has no call upon human justice. And you can only deliver me from it by blessing me frequently, as you have just done. 
Come be candid, said the coadjutor."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The beggar shook his head. The crime which I have committed, my lord, has no cause of human justice. And you can only deliver me from it by blessing me secretly as you have just done. Come up hanged said the persecutor.<|im_end|>", 0.6505840420722961, 2.097644567489624, "The beggar shook his head. The crime which I have committed, my lord, has no call upon human justice. And you can only deliver me from it by blessing me frequently, as you have just done. Come be candid, said the coadjutor."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The baker shook his head, the crime which I have committed now will be called by you injustice, and you can only deliver me from it by blessing us secretly as we have just done come up handed said the presider.<|im_end|>", -0.1792697161436081, -1.1796281337738037, "The beggar shook his head. The crime which I have committed, my lord, has no call upon human justice. And you can only deliver me from it by blessing me frequently, as you have just done. Come be candid, said the coadjutor."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The baker shook his head, the crime which I have committed now would have no place among you in justice and you can only deliver me from it by blessing me frequently as you have just done come with candids said the procurator.<|im_end|>", -0.018617816269397736, -0.5451788902282715, "The beggar shook his head. The crime which I have committed, my lord, has no call upon human justice. And you can only deliver me from it by blessing me frequently, as you have just done. 
Come be candid, said the coadjutor."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The baker shook his head. The crime which I have committed, my lord, has no place among men of justice, and you can only deliver me from it by blessing us frequently as you have just done come, I command it said the prelate jer.<|im_end|>", 0.08173446357250214, -0.1488659381866455, "The beggar shook his head. The crime which I have committed, my lord, has no call upon human justice. And you can only deliver me from it by blessing me frequently, as you have just done. Come be candid, said the coadjutor."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>So she had buttons up, and they were gradually accumulating with the emotions that stirred within one's mind for a perverse bush way. And his seeming grey matter now stirred the remembrance that but a year before, that women were riding the house you mean the shepherd<|im_end|>", -0.7879099249839783, -0.19305643439292908, "the buttons on phelan's coat were fairly undulating with the emotions that stirred within him in his seething gray matter there stirred the remembrance that bateato had told him that women were robbing the house you mean the women"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>So she did what was her favorite secret and tried to meditate with the emotions that stirred within one at first bushwick's heart in his seeming grey matter there stirred the remembrance that but a year ago he had been glummed for riding the house you mean to say it<|im_end|>", -1.2214081287384033, -1.8504221439361572, "the buttons on phelan's coat were fairly undulating with the emotions that stirred within him in his seething gray matter there stirred the remembrance that bateato had told him that women were 
robbing the house you mean the women"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Buttons had failed to wake him, and he was still accumulating with the emotions that stirred within him when he first bushwacked in his seething grey matter there stirred the remembrance that battyappo had told him that women were riding the house you mean a woman.<|im_end|>", -0.3585851192474365, 1.4483534097671509, "the buttons on phelan's coat were fairly undulating with the emotions that stirred within him in his seething gray matter there stirred the remembrance that bateato had told him that women were robbing the house you mean the women"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>So she did buttons of phaeton's face, and her accumulating with the emotions that stirred within him when he thought of those bushwhackers in his seething grey matter there stirred the remembrance that batty applewood had been there when they were riding the house you mean the sheriff<|im_end|>", -0.7295647859573364, 0.03001077100634575, "the buttons on phelan's coat were fairly undulating with the emotions that stirred within him in his seething gray matter there stirred the remembrance that bateato had told him that women were robbing the house you mean the women"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Shall button some favorite speaker and start accumulating with the emotions that stirred within one heart from verse bushwick's in seeming gray matter there stirred the remembrance that but a year before that women were riding the house you mean to show me<|im_end|>", -0.5899039506912231, 0.5639670491218567, "the buttons on phelan's coat were fairly undulating with the emotions that stirred within him in his seething gray matter there stirred the 
remembrance that bateato had told him that women were robbing the house you mean the women"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>So she'd bought some papers, and they kept accumulating with the emotions that stirred within one head from a first bushwick incident in seeming grey matter that stirred the remembrance that but a year before, that women were riding the house you mean the sheriff<|im_end|>", -0.8270294070243835, -0.3426194489002228, "the buttons on phelan's coat were fairly undulating with the emotions that stirred within him in his seething gray matter there stirred the remembrance that bateato had told him that women were robbing the house you mean the women"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>To shiver buttons on pavements and paving stones, accumulating with the emotions that stirred within one night from a first bush walk in his seemingly gray matter there stirred the remembrance that boccali had told them women were robbing the house you mean the sheriff.<|im_end|>", -0.24420489370822906, 1.8856559991836548, "the buttons on phelan's coat were fairly undulating with the emotions that stirred within him in his seething gray matter there stirred the remembrance that bateato had told him that women were robbing the house you mean the women"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>So she did what had some failing to break in, but he was accumulating with the emotions that stirred within him when he first met her. 
His seeming gray matter then stirred the remembrance that monte agello told him that women were riding the house you mean a woman?<|im_end|>", -0.9054762721061707, -0.6425402760505676, "the buttons on phelan's coat were fairly undulating with the emotions that stirred within him in his seething gray matter there stirred the remembrance that bateato had told him that women were robbing the house you mean the women"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>But some failing brain, in struggling with the emotions that stirred within one's mind from the first bushwackings, had succeeded in gray matter to restore the remembrance that botyappo told them that women were robbing the house you mean a woman<|im_end|>", -0.6036410331726074, 0.5114469528198242, "the buttons on phelan's coat were fairly undulating with the emotions that stirred within him in his seething gray matter there stirred the remembrance that bateato had told him that women were robbing the house you mean the women"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>What was on pailor's face, as she lay there accumulating with the emotions that stirred within one night from her first bush walk? 
It seemed in gray matter that stirred the remembrance that battyata had told them women were riding the house you mean a woman.<|im_end|>", -0.8083580732345581, -0.27123454213142395, "the buttons on phelan's coat were fairly undulating with the emotions that stirred within him in his seething gray matter there stirred the remembrance that bateato had told him that women were robbing the house you mean the women"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>So she did what tongues of phalanx waited and eagerly accumulating with the emotions that stirred within one heart for hours bushwick's voice in seeming grey matter had stirred the remembrance that buffy applewood knew that women were rotting the house you mean a servant?<|im_end|>", -0.9248790740966797, -0.716721773147583, "the buttons on phelan's coat were fairly undulating with the emotions that stirred within him in his seething gray matter there stirred the remembrance that bateato had told him that women were robbing the house you mean the women"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>So she had bought some table scraps and was very jubilating with the emotions that stirred within her when I first bushwaked. In his seeming gray matter, there stirred the remembrance that but a year before, that women were riding the house. 
You mean no shit.<|im_end|>", -0.848011314868927, -0.4228382110595703, "the buttons on phelan's coat were fairly undulating with the emotions that stirred within him in his seething gray matter there stirred the remembrance that bateato had told him that women were robbing the house you mean the women"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They set up the side show early in the morning before the first guests arrived at park.<|im_end|>", 0.7450000047683716, 0.012902800925076008, "They set up the sideshow early in the morning before the first guests arrived at park."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They set up the sideshow early in the morning before the first guest arrived at park.<|im_end|>", 0.8543975949287415, 0.8922801613807678, "They set up the sideshow early in the morning before the first guests arrived at park."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They set up the side show early in the morning before the first guests arrived at park.<|im_end|>", 0.7450000047683716, 0.012902800925076008, "They set up the sideshow early in the morning before the first guests arrived at park."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They set up the sideshow early in the morning before the first guests arrived at park.<|im_end|>", 1.0, 2.062685012817383, "They set up the sideshow early in the morning before the first guests arrived at park."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They set up the side show early in the morning before the first guest arrived at park.<|im_end|>", 0.5806475877761841, -1.3082213401794434, "They set up the sideshow 
early in the morning before the first guests arrived at park."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They set up the side show early in the morning before the first guests arrived at park.<|im_end|>", 0.7450000047683716, 0.012902800925076008, "They set up the sideshow early in the morning before the first guests arrived at park."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They set up the side show early in the morning before the first guest arrived at park.<|im_end|>", 0.5806475877761841, -1.3082213401794434, "They set up the sideshow early in the morning before the first guests arrived at park."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They set up the side show early in the morning before the first guest arrived at park.<|im_end|>", 0.5806475877761841, -1.3082213401794434, "They set up the sideshow early in the morning before the first guests arrived at park."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They set up the side show early in the morning before the first guests arrived at park.<|im_end|>", 0.7450000047683716, 0.012902800925076008, "They set up the sideshow early in the morning before the first guests arrived at park."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They set up the side show early in the morning before the first guests arrived at park.<|im_end|>", 0.7450000047683716, 0.012902800925076008, "They set up the sideshow early in the morning before the first guests arrived at park."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They set up the sideshow early in 
the morning before the first guest arrived at park.<|im_end|>", 0.8543975949287415, 0.8922801613807678, "They set up the sideshow early in the morning before the first guests arrived at park."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They set up the side show early in the morning before the first guests arrived at park.<|im_end|>", 0.7450000047683716, 0.012902800925076008, "They set up the sideshow early in the morning before the first guests arrived at park."]]}
|
wandb/run-20260417_125349-3c0s7mq3/files/output.log
ADDED
|
@@ -0,0 +1,76 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
wandb: Detected [openai] in use.
|
| 2 |
+
wandb: Use W&B Weave for improved LLM call tracing. Install Weave with `pip install weave` then add `import weave` to the top of your script.
|
| 3 |
+
wandb: For more information, check out the docs at: https://weave-docs.wandb.ai/
|
| 4 |
+
Train: 0%| | 0/9327 [00:00<?, ?it/s]Could not estimate the number of tokens of the input, floating-point operations will not be computed
|
| 5 |
+
[DEBUG generate] shape= (12, 245) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 6 |
+
[DEBUG _encode] has_resp= True prompt_len= 245 resp_len= 59 full_len= 304 label_non_ignore= 59
|
| 7 |
+
[DEBUG _encode] has_resp= True prompt_len= 245 resp_len= 53 full_len= 298 label_non_ignore= 53
|
| 8 |
+
[DEBUG _encode] has_resp= True prompt_len= 245 resp_len= 53 full_len= 298 label_non_ignore= 53
|
| 9 |
+
[DEBUG _encode] has_resp= True prompt_len= 245 resp_len= 54 full_len= 299 label_non_ignore= 54
|
| 10 |
+
[DEBUG _encode] has_resp= True prompt_len= 245 resp_len= 49 full_len= 294 label_non_ignore= 49
|
| 11 |
+
[DEBUG _encode] has_resp= True prompt_len= 245 resp_len= 60 full_len= 305 label_non_ignore= 60
|
| 12 |
+
[DEBUG _encode] has_resp= True prompt_len= 245 resp_len= 57 full_len= 302 label_non_ignore= 57
|
| 13 |
+
[DEBUG _encode] has_resp= True prompt_len= 245 resp_len= 55 full_len= 300 label_non_ignore= 55
|
| 14 |
+
[DEBUG _encode] has_resp= True prompt_len= 245 resp_len= 60 full_len= 305 label_non_ignore= 60
|
| 15 |
+
[DEBUG _encode] has_resp= True prompt_len= 245 resp_len= 51 full_len= 296 label_non_ignore= 51
|
| 16 |
+
[DEBUG generate] shape= (12, 245) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 17 |
+
[DEBUG generate] shape= (12, 74) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 18 |
+
[DEBUG generate] shape= (12, 74) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 19 |
+
Train: 0%| | 8/9327 [05:07<97:17:19, 37.58s/it]
|
| 20 |
+
{'loss': 0.00335923, 'grad_norm': 0.40496424, 'learning_rate': 1.8e-07, 'completions/mean_length': 46.63020992, 'completions/min_length': 29.0, 'completions/max_length': 62.5, 'completions/clipped_ratio': 0.0, 'reward': -0.39390102, 'reward_std': 0.14572198, 'frac_reward_zero_std': 0.0, 'rewards/ASRWerSubLenCmpHalluDirtyV56/mean': -0.39390099, 'rewards/ASRWerSubLenCmpHalluDirtyV56/std': 0.2566371, 'kl': 0.0, 'clip_ratio/low_mean': 0.0, 'clip_ratio/low_min': 0.0, 'clip_ratio/high_mean': 0.0, 'clip_ratio/high_max': 0.0, 'clip_ratio/region_mean': 0.0, 'step_time': 22.53670275, 'epoch': 0.0, 'global_step/max_steps': '1/9327', 'elapsed_time': '45s', 'remaining_time': '4d 21h 45m 37s', 'memory(GiB)': 6.6, 'train_speed(s/it)': 45.457502}
|
| 21 |
+
[DEBUG generate] shape= (12, 250) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 22 |
+
[DEBUG generate] shape= (12, 250) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 23 |
+
[DEBUG generate] shape= (12, 226) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 24 |
+
[DEBUG generate] shape= (12, 226) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 25 |
+
[DEBUG generate] shape= (12, 249) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 26 |
+
[DEBUG generate] shape= (12, 249) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 27 |
+
[DEBUG generate] shape= (12, 255) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 28 |
+
[DEBUG generate] shape= (12, 255) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 29 |
+
[DEBUG generate] shape= (12, 257) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 30 |
+
[DEBUG generate] shape= (12, 257) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 31 |
+
[DEBUG generate] shape= (12, 244) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 32 |
+
[DEBUG generate] shape= (12, 244) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 33 |
+
[DEBUG generate] shape= (12, 253) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 34 |
+
[DEBUG generate] shape= (12, 253) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 35 |
+
[DEBUG generate] shape= (12, 254) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 36 |
+
[DEBUG generate] shape= (12, 254) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 37 |
+
{'loss': 0.00341008, 'grad_norm': 0.55847734, 'learning_rate': 8.9e-07, 'completions/mean_length': 50.98437619, 'completions/min_length': 33.875, 'completions/max_length': 64.0625, 'completions/clipped_ratio': 0.0, 'reward': -0.02726497, 'reward_std': 0.16105477, 'frac_reward_zero_std': 0.0, 'rewards/ASRWerSubLenCmpHalluDirtyV56/mean': -0.02726497, 'rewards/ASRWerSubLenCmpHalluDirtyV56/std': 0.40726903, 'kl': 0.0036334, 'clip_ratio/low_mean': 0.01024817, 'clip_ratio/low_min': 0.00230935, 'clip_ratio/high_mean': 0.0056009, 'clip_ratio/high_max': 0.01153785, 'clip_ratio/region_mean': 0.01584908, 'step_time': 18.11644147, 'epoch': 0.0, 'global_step/max_steps': '5/9327', 'elapsed_time': '3m 15s', 'remaining_time': '4d 5h 3m 13s', 'memory(GiB)': 6.7, 'train_speed(s/it)': 39.025256}
|
| 38 |
+
[DEBUG generate] shape= (12, 239) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 39 |
+
[DEBUG generate] shape= (12, 239) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 40 |
+
[DEBUG generate] shape= (12, 246) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 41 |
+
[DEBUG generate] shape= (12, 246) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 42 |
+
[DEBUG generate] shape= (12, 135) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 43 |
+
[DEBUG generate] shape= (12, 135) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 44 |
+
[DEBUG generate] shape= (12, 221) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 45 |
+
[DEBUG generate] shape= (12, 221) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 46 |
+
[DEBUG generate] shape= (12, 244) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 47 |
+
[DEBUG generate] shape= (12, 244) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 48 |
+
[DEBUG generate] shape= (12, 236) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 49 |
+
[DEBUG generate] shape= (12, 236) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 50 |
+
[DEBUG generate] shape= (12, 244) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 51 |
+
[DEBUG generate] shape= (12, 244) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 52 |
+
[DEBUG generate] shape= (12, 244) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 53 |
+
[DEBUG generate] shape= (12, 244) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 54 |
+
[DEBUG generate] shape= (12, 236) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 55 |
+
[DEBUG generate] shape= (12, 236) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 56 |
+
[DEBUG generate] shape= (12, 238) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 57 |
+
[DEBUG generate] shape= (12, 238) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 58 |
+
{'loss': 0.00361177, 'grad_norm': 0.37292629, 'learning_rate': 1.79e-06, 'completions/mean_length': 51.17916794, 'completions/min_length': 35.95, 'completions/max_length': 65.9, 'completions/clipped_ratio': 0.0, 'reward': -0.01967886, 'reward_std': 0.1592014, 'frac_reward_zero_std': 0.0, 'rewards/ASRWerSubLenCmpHalluDirtyV56/mean': -0.01967885, 'rewards/ASRWerSubLenCmpHalluDirtyV56/std': 0.47400118, 'kl': 0.00512733, 'clip_ratio/low_mean': 0.01430356, 'clip_ratio/low_min': 0.00256842, 'clip_ratio/high_mean': 0.00864687, 'clip_ratio/high_max': 0.01792681, 'clip_ratio/region_mean': 0.02295043, 'step_time': 18.99083556, 'epoch': 0.0, 'global_step/max_steps': '10/9327', 'elapsed_time': '6m 28s', 'remaining_time': '4d 4h 26m 47s', 'memory(GiB)': 6.7, 'train_speed(s/it)': 38.811493}
|
| 59 |
+
[DEBUG generate] shape= (12, 223) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 60 |
+
[DEBUG generate] shape= (12, 223) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 61 |
+
[DEBUG generate] shape= (12, 241) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 62 |
+
[DEBUG generate] shape= (12, 241) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 63 |
+
[DEBUG generate] shape= (12, 193) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 64 |
+
[DEBUG generate] shape= (12, 193) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 65 |
+
[DEBUG generate] shape= (12, 246) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 66 |
+
[DEBUG generate] shape= (12, 246) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 67 |
+
[DEBUG generate] shape= (12, 252) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 68 |
+
[DEBUG generate] shape= (12, 252) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 69 |
+
[DEBUG generate] shape= (12, 252) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 70 |
+
[DEBUG generate] shape= (12, 252) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 71 |
+
[DEBUG generate] shape= (12, 248) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 72 |
+
[DEBUG generate] shape= (12, 248) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 73 |
+
[DEBUG generate] shape= (12, 231) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 74 |
+
[DEBUG generate] shape= (12, 231) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 75 |
+
[DEBUG generate] shape= (12, 247) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
| 76 |
+
[DEBUG generate] shape= (12, 247) last_col_pad_cnt= 0 first_col_pad_cnt= 0
|
wandb/run-20260417_125349-3c0s7mq3/files/requirements.txt
ADDED
|
@@ -0,0 +1,255 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
psutil==7.2.2
|
| 2 |
+
colorama==0.4.6
|
| 3 |
+
typing-inspection==0.4.2
|
| 4 |
+
dill==0.3.8
|
| 5 |
+
aliyun-python-sdk-kms==2.16.5
|
| 6 |
+
urllib3==2.6.3
|
| 7 |
+
torch==2.6.0
|
| 8 |
+
threadpoolctl==3.6.0
|
| 9 |
+
pyzmq==27.1.0
|
| 10 |
+
astor==0.8.1
|
| 11 |
+
hf-xet==1.4.3
|
| 12 |
+
sniffio==1.3.1
|
| 13 |
+
tensorboard==2.20.0
|
| 14 |
+
fastar==0.11.0
|
| 15 |
+
llvmlite==0.43.0
|
| 16 |
+
pathspec==1.0.4
|
| 17 |
+
mkl_fft==1.3.11
|
| 18 |
+
prometheus_client==0.25.0
|
| 19 |
+
async-timeout==5.0.1
|
| 20 |
+
scikit-learn==1.7.2
|
| 21 |
+
sortedcontainers==2.4.0
|
| 22 |
+
Bottleneck==1.4.2
|
| 23 |
+
orjson==3.11.8
|
| 24 |
+
nest-asyncio==1.6.0
|
| 25 |
+
cupy-cuda12x==13.6.0
|
| 26 |
+
semantic-version==2.10.0
|
| 27 |
+
aiosignal==1.4.0
|
| 28 |
+
fsspec==2025.3.0
|
| 29 |
+
dyNET38==2.2
|
| 30 |
+
shellingham==1.5.4
|
| 31 |
+
zstandard==0.25.0
|
| 32 |
+
PyYAML==6.0.3
|
| 33 |
+
nvidia-curand-cu12==10.3.5.147
|
| 34 |
+
gradio==5.50.0
|
| 35 |
+
Werkzeug==3.1.8
|
| 36 |
+
grpcio==1.80.0
|
| 37 |
+
aiohttp==3.13.5
|
| 38 |
+
Flask==3.1.3
|
| 39 |
+
python-json-logger==4.1.0
|
| 40 |
+
trl==0.29.1
|
| 41 |
+
nltk==3.9.4
|
| 42 |
+
platformdirs==4.9.6
|
| 43 |
+
lm-format-enforcer==0.10.12
|
| 44 |
+
pyparsing==3.3.2
|
| 45 |
+
jmespath==0.10.0
|
| 46 |
+
starlette==0.52.1
|
| 47 |
+
crcmod==1.7
|
| 48 |
+
dnspython==2.8.0
|
| 49 |
+
antlr4-python3-runtime==4.9.3
|
| 50 |
+
rouge==1.0.1
|
| 51 |
+
importlib_metadata==9.0.0
|
| 52 |
+
nvidia-cudnn-cu12==9.1.0.70
|
| 53 |
+
safetensors==0.7.0
|
| 54 |
+
blake3==1.0.8
|
| 55 |
+
interegular==0.3.3
|
| 56 |
+
tiktoken==0.11.0
|
| 57 |
+
pydantic_core==2.41.4
|
| 58 |
+
outlines==0.1.11
|
| 59 |
+
airportsdata==20260315
|
| 60 |
+
rich-toolkit==0.19.7
|
| 61 |
+
multiprocess==0.70.16
|
| 62 |
+
sympy==1.13.1
|
| 63 |
+
psutil==7.2.2
|
| 64 |
+
h11==0.16.0
|
| 65 |
+
anyio==4.13.0
|
| 66 |
+
Cython==3.2.4
|
| 67 |
+
outlines_core==0.1.26
|
| 68 |
+
jsonschema==4.26.0
|
| 69 |
+
nvidia-cuda-cupti-cu12==12.4.127
|
| 70 |
+
meson-python==0.19.0
|
| 71 |
+
depyf==0.18.0
|
| 72 |
+
audioread==3.1.0
|
| 73 |
+
typer==0.24.1
|
| 74 |
+
nvidia-cuda-nvrtc-cu12==12.4.127
|
| 75 |
+
joblib==1.5.3
|
| 76 |
+
torchvision==0.21.0
|
| 77 |
+
hf-gradio==0.3.2
|
| 78 |
+
huggingface_hub==0.36.2
|
| 79 |
+
websockets==15.0.1
|
| 80 |
+
diskcache==5.6.3
|
| 81 |
+
mistral_common==1.11.0
|
| 82 |
+
partial-json-parser==0.2.1.1.post7
|
| 83 |
+
simplejson==3.20.2
|
| 84 |
+
watchfiles==1.1.1
|
| 85 |
+
Jinja2==3.1.6
|
| 86 |
+
GitPython==3.1.46
|
| 87 |
+
numexpr==2.11.0
|
| 88 |
+
pydub==0.25.1
|
| 89 |
+
brotli==1.2.0
|
| 90 |
+
binpacking==2.0.1
|
| 91 |
+
cmake==4.3.1
|
| 92 |
+
pydantic==2.12.3
|
| 93 |
+
mkl-service==2.4.0
|
| 94 |
+
protobuf==6.33.6
|
| 95 |
+
gguf==0.10.0
|
| 96 |
+
MarkupSafe==3.0.3
|
| 97 |
+
exceptiongroup==1.3.1
|
| 98 |
+
markdown-it-py==4.0.0
|
| 99 |
+
soxr==1.0.0
|
| 100 |
+
pyarrow==20.0.0
|
| 101 |
+
tqdm==4.67.3
|
| 102 |
+
meson==1.11.0
|
| 103 |
+
fonttools==4.62.1
|
| 104 |
+
annotated-types==0.7.0
|
| 105 |
+
networkx==3.4.2
|
| 106 |
+
nvidia-cuda-runtime-cu12==12.4.127
|
| 107 |
+
compressed-tensors==0.9.2
|
| 108 |
+
wandb==0.23.0
|
| 109 |
+
mdurl==0.1.2
|
| 110 |
+
charset-normalizer==3.4.7
|
| 111 |
+
Pygments==2.20.0
|
| 112 |
+
zipp==3.23.1
|
| 113 |
+
prometheus-fastapi-instrumentator==7.1.0
|
| 114 |
+
aiofiles==24.1.0
|
| 115 |
+
lark==1.2.2
|
| 116 |
+
addict==2.4.0
|
| 117 |
+
pydantic-settings==2.13.1
|
| 118 |
+
opencv-python-headless==4.11.0.86
|
| 119 |
+
certifi==2026.2.25
|
| 120 |
+
sox==1.5.0
|
| 121 |
+
nagisa==0.2.11
|
| 122 |
+
six==1.17.0
|
| 123 |
+
tokenizers==0.22.2
|
| 124 |
+
mkl_random==1.2.8
|
| 125 |
+
fastapi-cloud-cli==0.17.0
|
| 126 |
+
propcache==0.4.1
|
| 127 |
+
cachetools==7.0.5
|
| 128 |
+
rpds-py==0.30.0
|
| 129 |
+
torchaudio==2.6.0
|
| 130 |
+
setuptools==82.0.1
|
| 131 |
+
py-cpuinfo==9.0.0
|
| 132 |
+
tomli==2.4.1
|
| 133 |
+
xxhash==3.6.0
|
| 134 |
+
pip==26.0.1
|
| 135 |
+
contourpy==1.3.2
|
| 136 |
+
absl-py==2.4.0
|
| 137 |
+
mpmath==1.3.0
|
| 138 |
+
ms_swift==4.0.3
|
| 139 |
+
pyproject-metadata==0.11.0
|
| 140 |
+
aiohappyeyeballs==2.6.1
|
| 141 |
+
httpx==0.28.1
|
| 142 |
+
json_repair==0.59.4
|
| 143 |
+
blinker==1.9.0
|
| 144 |
+
tzdata==2025.3
|
| 145 |
+
tensorboard-data-server==0.7.2
|
| 146 |
+
pydantic-extra-types==2.11.1
|
| 147 |
+
Markdown==3.10.2
|
| 148 |
+
nvidia-cusparselt-cu12==0.6.2
|
| 149 |
+
rignore==0.7.6
|
| 150 |
+
openai==2.32.0
|
| 151 |
+
soundfile==0.13.1
|
| 152 |
+
lazy-loader==0.5
|
| 153 |
+
av==14.2.0
|
| 154 |
+
yarl==1.23.0
|
| 155 |
+
python-dateutil==2.9.0.post0
|
| 156 |
+
groovy==0.1.2
|
| 157 |
+
xformers==0.0.29.post2
|
| 158 |
+
qwen-omni-utils==0.0.9
|
| 159 |
+
rich==15.0.0
|
| 160 |
+
xgrammar==0.1.16
|
| 161 |
+
numba==0.60.0
|
| 162 |
+
nvidia-cusolver-cu12==11.6.1.9
|
| 163 |
+
scikit_build_core==0.12.2
|
| 164 |
+
ffmpy==1.0.0
|
| 165 |
+
wheel==0.46.3
|
| 166 |
+
jiter==0.14.0
|
| 167 |
+
oss2==2.19.1
|
| 168 |
+
transformers==4.57.6
|
| 169 |
+
fastrlock==0.8.3
|
| 170 |
+
click==8.3.2
|
| 171 |
+
pooch==1.9.0
|
| 172 |
+
distro==1.9.0
|
| 173 |
+
nvidia-cublas-cu12==12.4.5.8
|
| 174 |
+
regex==2026.4.4
|
| 175 |
+
cpm-kernels==1.0.11
|
| 176 |
+
safehttpx==0.1.7
|
| 177 |
+
matplotlib==3.10.8
|
| 178 |
+
httptools==0.7.1
|
| 179 |
+
nvidia-cusparse-cu12==12.3.1.170
|
| 180 |
+
qwen-asr==0.0.6
|
| 181 |
+
gradio_client==1.14.0
|
| 182 |
+
gitdb==4.0.12
|
| 183 |
+
fastapi-cli==0.0.24
|
| 184 |
+
soynlp==0.0.493
|
| 185 |
+
python-dotenv==1.2.2
|
| 186 |
+
nvidia-cufft-cu12==11.2.1.3
|
| 187 |
+
accelerate==1.12.0
|
| 188 |
+
tomlkit==0.13.3
|
| 189 |
+
triton==3.2.0
|
| 190 |
+
filelock==3.28.0
|
| 191 |
+
pycountry==26.2.16
|
| 192 |
+
modelscope==1.35.4
|
| 193 |
+
annotated-doc==0.0.4
|
| 194 |
+
referencing==0.37.0
|
| 195 |
+
numpy==1.26.4
|
| 196 |
+
aliyun-python-sdk-core==2.16.0
|
| 197 |
+
attrs==26.1.0
|
| 198 |
+
vllm==0.8.0
|
| 199 |
+
python-multipart==0.0.26
|
| 200 |
+
jsonschema-specifications==2025.9.1
|
| 201 |
+
idna==3.11
|
| 202 |
+
scipy==1.15.3
|
| 203 |
+
typing_extensions==4.15.0
|
| 204 |
+
itsdangerous==2.2.0
|
| 205 |
+
msgspec==0.21.1
|
| 206 |
+
msgpack==1.1.2
|
| 207 |
+
nvidia-nvjitlink-cu12==12.4.127
|
| 208 |
+
pycryptodome==3.23.0
|
| 209 |
+
ninja==1.13.0
|
| 210 |
+
pillow==11.3.0
|
| 211 |
+
email-validator==2.3.0
|
| 212 |
+
cryptography==46.0.7
|
| 213 |
+
peft==0.18.1
|
| 214 |
+
kiwisolver==1.5.0
|
| 215 |
+
cffi==2.0.0
|
| 216 |
+
einops==0.8.2
|
| 217 |
+
pytz==2026.1.post1
|
| 218 |
+
uvloop==0.22.1
|
| 219 |
+
requests==2.33.1
|
| 220 |
+
sentencepiece==0.2.1
|
| 221 |
+
attrdict==2.0.1
|
| 222 |
+
dacite==1.9.2
|
| 223 |
+
cloudpickle==3.1.2
|
| 224 |
+
ray==2.55.0
|
| 225 |
+
fastapi==0.135.3
|
| 226 |
+
librosa==0.11.0
|
| 227 |
+
ruff==0.15.10
|
| 228 |
+
multidict==6.7.1
|
| 229 |
+
smmap==5.0.3
|
| 230 |
+
packaging==26.0
|
| 231 |
+
pycparser==3.0
|
| 232 |
+
decorator==5.2.1
|
| 233 |
+
transformers-stream-generator==0.0.5
|
| 234 |
+
nvidia-nccl-cu12==2.21.5
|
| 235 |
+
frozenlist==1.8.0
|
| 236 |
+
uvicorn==0.44.0
|
| 237 |
+
datasets==3.6.0
|
| 238 |
+
cycler==0.12.1
|
| 239 |
+
omegaconf==2.3.0
|
| 240 |
+
httpcore==1.0.9
|
| 241 |
+
pandas==2.3.2
|
| 242 |
+
nvidia-nvtx-cu12==12.4.127
|
| 243 |
+
sentry-sdk==2.58.0
|
| 244 |
+
wheel==0.46.3
|
| 245 |
+
autocommand==2.2.2
|
| 246 |
+
tomli==2.4.0
|
| 247 |
+
packaging==26.0
|
| 248 |
+
more-itertools==10.8.0
|
| 249 |
+
zipp==3.23.0
|
| 250 |
+
platformdirs==4.4.0
|
| 251 |
+
jaraco.context==6.1.0
|
| 252 |
+
jaraco.text==4.0.0
|
| 253 |
+
backports.tarfile==1.2.0
|
| 254 |
+
jaraco.functools==4.4.0
|
| 255 |
+
importlib_metadata==8.7.1
|
wandb/run-20260417_125349-3c0s7mq3/files/wandb-metadata.json
ADDED
|
@@ -0,0 +1,224 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"os": "Linux-3.10.0-957.el7.x86_64-x86_64-with-glibc2.17",
|
| 3 |
+
"python": "CPython 3.10.18",
|
| 4 |
+
"startedAt": "2026-04-17T04:53:49.174280Z",
|
| 5 |
+
"args": [
|
| 6 |
+
"--rlhf_type",
|
| 7 |
+
"grpo",
|
| 8 |
+
"--external_plugins",
|
| 9 |
+
"/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/my_qwen3_asr_dapo_register.py",
|
| 10 |
+
"/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/0417_reward.py",
|
| 11 |
+
"--model",
|
| 12 |
+
"/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/qwen3-asr-merged",
|
| 13 |
+
"--model_type",
|
| 14 |
+
"my_qwen3_asr_rl",
|
| 15 |
+
"--template",
|
| 16 |
+
"my_qwen3_asr_rl",
|
| 17 |
+
"--dataset",
|
| 18 |
+
"/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/lora_0323_10w+55w+error+syn_with_domain_train90_targeted_rl_train90_loramerged_basewer_3suppress_server.jsonl",
|
| 19 |
+
"--val_dataset",
|
| 20 |
+
"/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/lora_0323_10w+55w+error+syn_with_domain_train90_targeted_rl_val5_sample5p_server.jsonl",
|
| 21 |
+
"--reward_funcs",
|
| 22 |
+
"asr_wer_sub_len_cmp_hallu_dirty_v56",
|
| 23 |
+
"--train_type",
|
| 24 |
+
"lora",
|
| 25 |
+
"--use_vllm",
|
| 26 |
+
"false",
|
| 27 |
+
"--log_completions",
|
| 28 |
+
"true",
|
| 29 |
+
"--loss_type",
|
| 30 |
+
"dapo",
|
| 31 |
+
"--advantage_estimator",
|
| 32 |
+
"grpo",
|
| 33 |
+
"--scale_rewards",
|
| 34 |
+
"group",
|
| 35 |
+
"--num_iterations",
|
| 36 |
+
"2",
|
| 37 |
+
"--beta",
|
| 38 |
+
"0.04",
|
| 39 |
+
"--epsilon_high",
|
| 40 |
+
"0.28",
|
| 41 |
+
"--dynamic_sample",
|
| 42 |
+
"true",
|
| 43 |
+
"--max_resample_times",
|
| 44 |
+
"4",
|
| 45 |
+
"--overlong_filter",
|
| 46 |
+
"true",
|
| 47 |
+
"--truncation_strategy",
|
| 48 |
+
"delete",
|
| 49 |
+
"--num_generations",
|
| 50 |
+
"12",
|
| 51 |
+
"--generation_batch_size",
|
| 52 |
+
"48",
|
| 53 |
+
"--per_device_train_batch_size",
|
| 54 |
+
"4",
|
| 55 |
+
"--per_device_eval_batch_size",
|
| 56 |
+
"4",
|
| 57 |
+
"--gradient_accumulation_steps",
|
| 58 |
+
"12",
|
| 59 |
+
"--num_generations_eval",
|
| 60 |
+
"4",
|
| 61 |
+
"--max_completion_length",
|
| 62 |
+
"256",
|
| 63 |
+
"--temperature",
|
| 64 |
+
"0.50",
|
| 65 |
+
"--top_p",
|
| 66 |
+
"0.95",
|
| 67 |
+
"--top_k",
|
| 68 |
+
"50",
|
| 69 |
+
"--repetition_penalty",
|
| 70 |
+
"1.08",
|
| 71 |
+
"--learning_rate",
|
| 72 |
+
"5e-5",
|
| 73 |
+
"--lr_scheduler_type",
|
| 74 |
+
"cosine",
|
| 75 |
+
"--warmup_ratio",
|
| 76 |
+
"0.03",
|
| 77 |
+
"--report_to",
|
| 78 |
+
"wandb",
|
| 79 |
+
"--run_name",
|
| 80 |
+
"qwen3asr_dapo_reward56_4x4x12_12gen_4GPU",
|
| 81 |
+
"--output_dir",
|
| 82 |
+
"/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/out/qwen3asr_dapo_reward56_4x4x12_12gen_4GPU",
|
| 83 |
+
"--save_strategy",
|
| 84 |
+
"steps",
|
| 85 |
+
"--save_steps",
|
| 86 |
+
"20",
|
| 87 |
+
"--logging_steps",
|
| 88 |
+
"5",
|
| 89 |
+
"--freeze_llm",
|
| 90 |
+
"false",
|
| 91 |
+
"--freeze_vit",
|
| 92 |
+
"false",
|
| 93 |
+
"--freeze_aligner",
|
| 94 |
+
"false",
|
| 95 |
+
"--remove_unused_columns",
|
| 96 |
+
"false",
|
| 97 |
+
"--padding_side",
|
| 98 |
+
"left"
|
| 99 |
+
],
|
| 100 |
+
"program": "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/cli/rlhf.py",
|
| 101 |
+
"email": "pang_kaiyu@163.com",
|
| 102 |
+
"root": "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload",
|
| 103 |
+
"host": "SH-IDC1-10-140-37-28",
|
| 104 |
+
"executable": "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/bin/python3.10",
|
| 105 |
+
"cpu_count": 64,
|
| 106 |
+
"cpu_count_logical": 128,
|
| 107 |
+
"gpu": "NVIDIA A100-SXM4-80GB",
|
| 108 |
+
"gpu_count": 8,
|
| 109 |
+
"disk": {
|
| 110 |
+
"/": {
|
| 111 |
+
"total": "524945911808",
|
| 112 |
+
"used": "49879580672"
|
| 113 |
+
}
|
| 114 |
+
},
|
| 115 |
+
"memory": {
|
| 116 |
+
"total": "1081627828224"
|
| 117 |
+
},
|
| 118 |
+
"gpu_nvidia": [
|
| 119 |
+
{
|
| 120 |
+
"name": "NVIDIA A100-SXM4-80GB",
|
| 121 |
+
"memoryTotal": "85899345920",
|
| 122 |
+
"cudaCores": 6912,
|
| 123 |
+
"architecture": "Ampere",
|
| 124 |
+
"uuid": "GPU-3da6624c-f6f7-fce6-4711-27acab73dc93"
|
| 125 |
+
},
|
| 126 |
+
{
|
| 127 |
+
"name": "NVIDIA A100-SXM4-80GB",
|
| 128 |
+
"memoryTotal": "85899345920",
|
| 129 |
+
"cudaCores": 6912,
|
| 130 |
+
"architecture": "Ampere",
|
| 131 |
+
"uuid": "GPU-dae83544-a631-a3fe-b5d5-e4fdd056c7a8"
|
| 132 |
+
},
|
| 133 |
+
{
|
| 134 |
+
"name": "NVIDIA A100-SXM4-80GB",
|
| 135 |
+
"memoryTotal": "85899345920",
|
| 136 |
+
"cudaCores": 6912,
|
| 137 |
+
"architecture": "Ampere",
|
| 138 |
+
"uuid": "GPU-621aa0b9-4a32-d349-8a16-20b8b6f0dde4"
|
| 139 |
+
},
|
| 140 |
+
{
|
| 141 |
+
"name": "NVIDIA A100-SXM4-80GB",
|
| 142 |
+
"memoryTotal": "85899345920",
|
| 143 |
+
"cudaCores": 6912,
|
| 144 |
+
"architecture": "Ampere",
|
| 145 |
+
"uuid": "GPU-642bed5e-3bf1-b5e0-8aba-33f8f64a5dcc"
|
| 146 |
+
},
|
| 147 |
+
{
|
| 148 |
+
"name": "NVIDIA A100-SXM4-80GB",
|
| 149 |
+
"memoryTotal": "85899345920",
|
| 150 |
+
"cudaCores": 6912,
|
| 151 |
+
"architecture": "Ampere",
|
| 152 |
+
"uuid": "GPU-6c70bd3b-1e58-bd2a-a10b-19891e3eab9a"
|
| 153 |
+
},
|
| 154 |
+
{
|
| 155 |
+
"name": "NVIDIA A100-SXM4-80GB",
|
| 156 |
+
"memoryTotal": "85899345920",
|
| 157 |
+
"cudaCores": 6912,
|
| 158 |
+
"architecture": "Ampere",
|
| 159 |
+
"uuid": "GPU-96e9e2d3-6436-3c7f-5a20-1d4a32e7992c"
|
| 160 |
+
},
|
| 161 |
+
{
|
| 162 |
+
"name": "NVIDIA A100-SXM4-80GB",
|
| 163 |
+
"memoryTotal": "85899345920",
|
| 164 |
+
"cudaCores": 6912,
|
| 165 |
+
"architecture": "Ampere",
|
| 166 |
+
"uuid": "GPU-dba7546f-0cda-e659-ca1d-4790c27ffe8d"
|
| 167 |
+
},
|
| 168 |
+
{
|
| 169 |
+
"name": "NVIDIA A100-SXM4-80GB",
|
| 170 |
+
"memoryTotal": "85899345920",
|
| 171 |
+
"cudaCores": 6912,
|
| 172 |
+
"architecture": "Ampere",
|
| 173 |
+
"uuid": "GPU-b0a96cf9-74f3-969a-e8d0-5a30f3f06d1e"
|
| 174 |
+
}
|
| 175 |
+
],
|
| 176 |
+
"cudaVersion": "12.4",
|
| 177 |
+
"slurm": {
|
| 178 |
+
"cluster_name": "cluster_sproject3",
|
| 179 |
+
"conf": "/etc/slurm/slurm.conf",
|
| 180 |
+
"cpus_on_node": "2",
|
| 181 |
+
"gtids": "0",
|
| 182 |
+
"job_account": "research",
|
| 183 |
+
"job_cpus_per_node": "2",
|
| 184 |
+
"job_gid": "800000689",
|
| 185 |
+
"job_id": "8568855",
|
| 186 |
+
"job_name": "qwen3_asr_train_4gpu",
|
| 187 |
+
"job_nodelist": "SH-IDC1-10-140-37-28",
|
| 188 |
+
"job_num_nodes": "1",
|
| 189 |
+
"job_partition": "interntmp",
|
| 190 |
+
"job_qos": "normal",
|
| 191 |
+
"job_uid": "800000689",
|
| 192 |
+
"job_user": "panjiabao",
|
| 193 |
+
"jobid": "8568855",
|
| 194 |
+
"launch_node_ipaddr": "10.140.37.164",
|
| 195 |
+
"localid": "0",
|
| 196 |
+
"nnodes": "1",
|
| 197 |
+
"nodeid": "0",
|
| 198 |
+
"nodelist": "SH-IDC1-10-140-37-28",
|
| 199 |
+
"nprocs": "1",
|
| 200 |
+
"ntasks": "1",
|
| 201 |
+
"ntasks_per_node": "1",
|
| 202 |
+
"prio_process": "0",
|
| 203 |
+
"procid": "0",
|
| 204 |
+
"srun_comm_host": "10.140.37.164",
|
| 205 |
+
"srun_comm_port": "39944",
|
| 206 |
+
"step_gpus": "4,5,6,7",
|
| 207 |
+
"step_id": "0",
|
| 208 |
+
"step_launcher_port": "39944",
|
| 209 |
+
"step_nodelist": "SH-IDC1-10-140-37-28",
|
| 210 |
+
"step_num_nodes": "1",
|
| 211 |
+
"step_num_tasks": "1",
|
| 212 |
+
"step_tasks_per_node": "1",
|
| 213 |
+
"stepid": "0",
|
| 214 |
+
"submit_dir": "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload",
|
| 215 |
+
"submit_host": "SH-IDC1-10-140-37-164",
|
| 216 |
+
"task_pid": "253884",
|
| 217 |
+
"tasks_per_node": "1",
|
| 218 |
+
"topology_addr": "SH-IDC1-10-140-37-28",
|
| 219 |
+
"topology_addr_pattern": "node",
|
| 220 |
+
"umask": "0002",
|
| 221 |
+
"working_cluster": "cluster_sproject3:SH-IDC1-10-140-37-161:6817:9216:109"
|
| 222 |
+
},
|
| 223 |
+
"writerId": "j5sm4ok14e8glxftszvcldkdpfaj9tjk"
|
| 224 |
+
}
|
wandb/run-20260417_125349-3c0s7mq3/files/wandb-summary.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"profiling/Time taken: GRPOTrainer._prepare_inputs":1.0380055755376816e-05,"train/clip_ratio/low_min":0.0025684179776969056,"completions":{"artifact_path":"wandb-client-artifact://uxb8hpe90ova7jczka8irjgjvda1abucqjkcj2xforoqlkmgy8m2ogk528hkqzciqt27cmh80q6ooyt95k6jpzt8j12bp5out3isrdz6jt3e0rqqyb8j8sbkeuw9z88u/completions.table.json","ncols":6,"sha256":"510c5f07b145276e42100fb7a1579a1a90630c3d4b603b455e0179b2425e7ba9","size":27491,"log_mode":"IMMUTABLE","_latest_artifact_path":"wandb-client-artifact://c0nc1huy2dg0glf8439n1pxjl0jfm9ih2xohqkvhrckav2b6emj75t25u8r70nmykdappetknoyherfthhsx0dnv0iba9azrtgonx2q7fd4ur4g65wplov58boq40hos:latest/completions.table.json","nrows":48,"_type":"table-file","path":"media/table/completions_5_510c5f07b145276e4210.table.json"},"train/step_time":18.990835564490407,"profiling/Time taken: GRPOTrainer._generate_and_score_completions":6.459590430138633,"profiling/Time taken: GRPOTrainer._dynamic_sampling":0.0027582282200455666,"train/frac_reward_zero_std":0,"train/rewards/ASRWerSubLenCmpHalluDirtyV56/mean":-0.01967885121703148,"train/completions/clipped_ratio":0,"train/clip_ratio/high_max":0.01792680664608876,"train/epoch":0.0032164683177870698,"profiling/Time taken: GRPOTrainer.compute_loss":0.42181658814661205,"train/kl":0.005127331020776183,"_step":6,"train/clip_ratio/region_mean":0.022950426349416374,"train/clip_ratio/low_mean":0.014303557314754774,"train/rewards/ASRWerSubLenCmpHalluDirtyV56/std":0.4740011841058731,"profiling/Time taken: GRPOTrainer.log_metrics":0.021599401021376252,"profiling/Time taken: 
GRPOTrainer.resample_encode_failed_inputs":0.09793815203011036,"train/learning_rate":1.7857142857142857e-06,"train/clip_ratio/high_mean":0.008646869304357097,"train/reward":-0.019678859598934652,"train/completions/mean_length":51.179167938232425,"train/grad_norm":0.3729262948036194,"train/completions/max_length":65.9,"train/reward_std":0.15920140147209166,"train/completions/min_length":35.95,"train/loss":0.003611765429377556,"_timestamp":1.7764021900309644e+09,"_wandb":{"runtime":559},"profiling/Time taken: GRPOTrainer._get_per_token_logps_and_entropies":0.3787236858624965,"profiling/Time taken: GRPOTrainer._prepare_batch_inputs":1.4868471620138735,"profiling/Time taken: GRPOTrainer._score_completions":0.1824264999013394,"profiling/Time taken: GRPOTrainer.generate":4.603045840980485,"_runtime":559.310393838,"train/global_step":10,"profiling/Time taken: GRPOTrainer.ASRWerSubLenCmpHalluDirtyV56":0.18123672483488917}
|
wandb/run-20260417_125349-3c0s7mq3/logs/debug-core.log
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{"time":"2026-04-17T12:53:49.510806063+08:00","level":"INFO","msg":"main: starting server","port-filename":"/tmp/tmp9sgje0qy/port-255159.txt","pid":255159,"log-level":0,"disable-analytics":false,"shutdown-on-parent-exit":false,"enable-dcgm-profiling":false}
|
| 2 |
+
{"time":"2026-04-17T12:53:49.512883475+08:00","level":"INFO","msg":"server: will exit if parent process dies","ppid":255159}
|
| 3 |
+
{"time":"2026-04-17T12:53:49.512897523+08:00","level":"INFO","msg":"server: accepting connections","addr":{"Name":"/tmp/wandb-255159-255838-1984267321/socket","Net":"unix"}}
|
| 4 |
+
{"time":"2026-04-17T12:53:49.589507097+08:00","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"1(@)"}
|
| 5 |
+
{"time":"2026-04-17T12:53:49.596836313+08:00","level":"INFO","msg":"handleInformInit: received","streamId":"3c0s7mq3","id":"1(@)"}
|
| 6 |
+
{"time":"2026-04-17T12:53:50.060383382+08:00","level":"INFO","msg":"handleInformInit: stream started","streamId":"3c0s7mq3","id":"1(@)"}
|
| 7 |
+
{"time":"2026-04-17T13:03:10.120189546+08:00","level":"INFO","msg":"handleInformTeardown: server teardown initiated","id":"1(@)"}
|
| 8 |
+
{"time":"2026-04-17T13:03:10.120718112+08:00","level":"INFO","msg":"server is shutting down"}
|
| 9 |
+
{"time":"2026-04-17T13:03:10.120709431+08:00","level":"INFO","msg":"connection: closing","id":"1(@)"}
|
| 10 |
+
{"time":"2026-04-17T13:03:10.1212097+08:00","level":"INFO","msg":"server: listener closed","addr":{"Name":"/tmp/wandb-255159-255838-1984267321/socket","Net":"unix"}}
|
| 11 |
+
{"time":"2026-04-17T13:03:10.121584463+08:00","level":"INFO","msg":"connection: closed successfully","id":"1(@)"}
|
wandb/run-20260417_125349-3c0s7mq3/logs/debug-internal.log
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{"time":"2026-04-17T12:53:49.599295874+08:00","level":"INFO","msg":"stream: starting","core version":"0.23.0"}
|
| 2 |
+
{"time":"2026-04-17T12:53:50.056880322+08:00","level":"INFO","msg":"stream: created new stream","id":"3c0s7mq3"}
|
| 3 |
+
{"time":"2026-04-17T12:53:50.056952984+08:00","level":"INFO","msg":"handler: started","stream_id":"3c0s7mq3"}
|
| 4 |
+
{"time":"2026-04-17T12:53:50.060375782+08:00","level":"INFO","msg":"stream: started","id":"3c0s7mq3"}
|
| 5 |
+
{"time":"2026-04-17T12:53:50.060385935+08:00","level":"INFO","msg":"sender: started","stream_id":"3c0s7mq3"}
|
| 6 |
+
{"time":"2026-04-17T12:53:50.060388859+08:00","level":"INFO","msg":"writer: started","stream_id":"3c0s7mq3"}
|
| 7 |
+
{"time":"2026-04-17T13:03:10.120719587+08:00","level":"INFO","msg":"stream: closing","id":"3c0s7mq3"}
|
| 8 |
+
{"time":"2026-04-17T13:03:11.075949443+08:00","level":"INFO","msg":"fileTransfer: Close: file transfer manager closed"}
|
| 9 |
+
{"time":"2026-04-17T13:03:12.765331132+08:00","level":"INFO","msg":"handler: closed","stream_id":"3c0s7mq3"}
|
| 10 |
+
{"time":"2026-04-17T13:03:12.766657126+08:00","level":"INFO","msg":"sender: closed","stream_id":"3c0s7mq3"}
|
| 11 |
+
{"time":"2026-04-17T13:03:12.766668686+08:00","level":"INFO","msg":"stream: closed","id":"3c0s7mq3"}
|
wandb/run-20260417_125349-3c0s7mq3/logs/debug.log
ADDED
|
@@ -0,0 +1,26 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
2026-04-17 12:53:49,233 INFO MainThread:255159 [wandb_setup.py:_flush():80] Current SDK version is 0.23.0
|
| 2 |
+
2026-04-17 12:53:49,233 INFO MainThread:255159 [wandb_setup.py:_flush():80] Configure stats pid to 255159
|
| 3 |
+
2026-04-17 12:53:49,233 INFO MainThread:255159 [wandb_setup.py:_flush():80] Loading settings from /mnt/petrelfs/panjiabao/.config/wandb/settings
|
| 4 |
+
2026-04-17 12:53:49,233 INFO MainThread:255159 [wandb_setup.py:_flush():80] Loading settings from /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/wandb/settings
|
| 5 |
+
2026-04-17 12:53:49,233 INFO MainThread:255159 [wandb_setup.py:_flush():80] Loading settings from environment variables
|
| 6 |
+
2026-04-17 12:53:49,233 INFO MainThread:255159 [wandb_init.py:setup_run_log_directory():713] Logging user logs to /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/wandb/run-20260417_125349-3c0s7mq3/logs/debug.log
|
| 7 |
+
2026-04-17 12:53:49,233 INFO MainThread:255159 [wandb_init.py:setup_run_log_directory():714] Logging internal logs to /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/wandb/run-20260417_125349-3c0s7mq3/logs/debug-internal.log
|
| 8 |
+
2026-04-17 12:53:49,233 INFO MainThread:255159 [wandb_init.py:init():840] calling init triggers
|
| 9 |
+
2026-04-17 12:53:49,233 INFO MainThread:255159 [wandb_init.py:init():845] wandb.init called with sweep_config: {}
|
| 10 |
+
config: {'_wandb': {}}
|
| 11 |
+
2026-04-17 12:53:49,233 INFO MainThread:255159 [wandb_init.py:init():888] starting backend
|
| 12 |
+
2026-04-17 12:53:49,589 INFO MainThread:255159 [wandb_init.py:init():891] sending inform_init request
|
| 13 |
+
2026-04-17 12:53:49,594 INFO MainThread:255159 [wandb_init.py:init():899] backend started and connected
|
| 14 |
+
2026-04-17 12:53:49,598 INFO MainThread:255159 [wandb_init.py:init():969] updated telemetry
|
| 15 |
+
2026-04-17 12:53:49,599 INFO MainThread:255159 [wandb_init.py:init():993] communicating run to backend with 90.0 second timeout
|
| 16 |
+
2026-04-17 12:53:50,809 INFO MainThread:255159 [wandb_init.py:init():1040] starting run threads in backend
|
| 17 |
+
2026-04-17 12:53:51,513 INFO MainThread:255159 [wandb_run.py:_console_start():2504] atexit reg
|
| 18 |
+
2026-04-17 12:53:51,514 INFO MainThread:255159 [wandb_run.py:_redirect():2352] redirect: wrap_raw
|
| 19 |
+
2026-04-17 12:53:51,514 INFO MainThread:255159 [wandb_run.py:_redirect():2421] Wrapping output streams.
|
| 20 |
+
2026-04-17 12:53:51,514 INFO MainThread:255159 [wandb_run.py:_redirect():2444] Redirects installed.
|
| 21 |
+
2026-04-17 12:53:51,521 INFO MainThread:255159 [wandb_init.py:init():1080] run started, returning control to user process
|
| 22 |
+
2026-04-17 12:53:51,528 INFO MainThread:255159 [wandb_run.py:_config_callback():1385] config_cb None None {'peft_config': {'default': {'task_type': 'CAUSAL_LM', 'peft_type': 'LORA', 'auto_mapping': None, 'peft_version': '0.18.1', 'base_model_name_or_path': '/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/qwen3-asr-merged', 'revision': None, 'inference_mode': False, 'r': 8, 'target_modules': '^(thinker\\.model(?=\\.).*\\.(k_proj|q_proj|down_proj|up_proj|v_proj|gate_proj|o_proj)|thinker\\.audio_tower\\.layers(?=\\.).*\\.(k_proj|fc1|fc2|q_proj|out_proj|v_proj)|thinker\\.audio_tower\\.conv_out(?=\\.)|thinker\\.audio_tower\\.proj1(?=\\.)|thinker\\.audio_tower\\.proj2(?=\\.))$', 'exclude_modules': None, 'lora_alpha': 32, 'lora_dropout': 0.05, 'fan_in_fan_out': False, 'bias': 'none', 'use_rslora': False, 'modules_to_save': [], 'init_lora_weights': True, 'layers_to_transform': None, 'layers_pattern': None, 'rank_pattern': {}, 'alpha_pattern': {}, 'megatron_config': None, 'megatron_core': 'megatron.core', 'trainable_token_indices': None, 'loftq_config': {}, 'eva_config': None, 'corda_config': None, 'use_dora': False, 'alora_invocation_tokens': None, 'use_qalora': False, 'qalora_group_size': 16, 'layer_replication': None, 'runtime_config': {'ephemeral_gpu_offload': False}, 'lora_bias': False, 'target_parameters': None, 'arrow_config': None, 'ensure_weight_tying': False, 'lora_dtype': None, 'lorap_lr_ratio': None, 'lorap_emb_lr': 1e-06}}, 'return_dict': True, 'output_hidden_states': False, 'torchscript': False, 'dtype': 'bfloat16', 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'architectures': ['Qwen3ASRForConditionalGeneration'], 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'task_specific_params': None, 'problem_type': None, 
'tokenizer_class': None, 'prefix': None, 'bos_token_id': None, 'pad_token_id': 151643, 'eos_token_id': 151645, 'sep_token_id': None, 'decoder_start_token_id': None, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'temperature': 0.5, 'top_k': 50, 'top_p': 0.95, 'typical_p': 1.0, 'repetition_penalty': 1.08, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'num_beam_groups': 1, 'diversity_penalty': 0.0, '_name_or_path': '/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/qwen3-asr-merged', 'transformers_version': '4.57.6', 'model_type': 'qwen3_asr', 'tf_legacy_loss': False, 'use_bfloat16': False, 'thinker_config': {'return_dict': True, 'output_hidden_states': False, 'torchscript': False, 'dtype': 'bfloat16', 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'architectures': ['Qwen3ASRForConditionalGeneration'], 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'task_specific_params': None, 'problem_type': None, 'tokenizer_class': None, 'prefix': None, 'bos_token_id': None, 'pad_token_id': None, 'eos_token_id': None, 'sep_token_id': None, 'decoder_start_token_id': None, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'typical_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 
'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'num_beam_groups': 1, 'diversity_penalty': 0.0, '_name_or_path': '', 'audio_end_token_id': 151670, 'model_type': 'qwen3_asr_thinker', 'tf_legacy_loss': False, 'use_bfloat16': False, 'user_token_id': 872, 'audio_start_token_id': 151669, 'initializer_range': 0.02, 'audio_config': {'return_dict': True, 'output_hidden_states': False, 'torchscript': False, 'dtype': None, 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'architectures': None, 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'task_specific_params': None, 'problem_type': None, 'tokenizer_class': None, 'prefix': None, 'bos_token_id': None, 'pad_token_id': None, 'eos_token_id': None, 'sep_token_id': None, 'decoder_start_token_id': None, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'typical_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'num_beam_groups': 1, 'diversity_penalty': 0.0, '_name_or_path': '', 'model_type': 'qwen3_asr_audio_encoder', 'num_hidden_layers': 24, 'tf_legacy_loss': False, 'use_bfloat16': False, 'num_mel_bins': 128, 'd_model': 
1024, 'encoder_layers': 24, 'encoder_attention_heads': 16, 'encoder_ffn_dim': 4096, 'dropout': 0, 'attention_dropout': 0, 'activation_function': 'gelu', 'activation_dropout': 0, 'initializer_range': 0.02, 'scale_embedding': False, 'max_source_positions': 1500, 'n_window': 50, 'output_dim': 2048, 'n_window_infer': 800, 'conv_chunksize': 500, 'downsample_hidden_size': 480, 'output_attentions': False}, 'text_config': {'vocab_size': 151936, 'max_position_embeddings': 65536, 'hidden_size': 2048, 'intermediate_size': 6144, 'num_hidden_layers': 28, 'num_attention_heads': 16, 'num_key_value_heads': 8, 'head_dim': 128, 'hidden_act': 'silu', 'initializer_range': 0.02, 'rms_norm_eps': 1e-06, 'use_cache': False, 'rope_theta': 1000000, 'rope_scaling': {'interleaved': True, 'mrope_interleaved': True, 'mrope_section': [24, 20, 20], 'rope_type': 'default', 'type': 'default'}, 'attention_bias': False, 'attention_dropout': 0.0, 'return_dict': True, 'output_hidden_states': False, 'torchscript': False, 'dtype': None, 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'architectures': None, 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'task_specific_params': None, 'problem_type': None, 'tokenizer_class': None, 'prefix': None, 'bos_token_id': None, 'pad_token_id': 151643, 'eos_token_id': None, 'sep_token_id': None, 'decoder_start_token_id': None, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'typical_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 
'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'num_beam_groups': 1, 'diversity_penalty': 0.0, '_name_or_path': '', 'model_type': 'qwen3_asr_text', 'tf_legacy_loss': False, 'use_bfloat16': False, 'output_attentions': False}, 'audio_token_id': 151676, 'output_attentions': False}, 'support_languages': ['Chinese', 'English', 'Cantonese', 'Arabic', 'German', 'French', 'Spanish', 'Portuguese', 'Indonesian', 'Italian', 'Korean', 'Russian', 'Thai', 'Vietnamese', 'Japanese', 'Turkish', 'Hindi', 'Malay', 'Dutch', 'Swedish', 'Danish', 'Finnish', 'Polish', 'Czech', 'Filipino', 'Persian', 'Greek', 'Romanian', 'Hungarian', 'Macedonian'], 'output_attentions': False, 'output_dir': '/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/out/qwen3asr_dapo_reward56_4x4x12_12gen_4GPU/v4-20260417-125332', 'overwrite_output_dir': False, 'do_train': False, 'do_eval': True, 'do_predict': False, 'eval_strategy': 'steps', 'prediction_loss_only': False, 'per_device_train_batch_size': 4, 'per_device_eval_batch_size': 4, 'per_gpu_train_batch_size': None, 'per_gpu_eval_batch_size': None, 'gradient_accumulation_steps': 12, 'eval_accumulation_steps': None, 'eval_delay': 0, 'torch_empty_cache_steps': None, 'learning_rate': 5e-05, 'weight_decay': 0.1, 'adam_beta1': 0.9, 'adam_beta2': 0.95, 'adam_epsilon': 1e-08, 'max_grad_norm': 1.0, 'num_train_epochs': 3.0, 'max_steps': -1, 'lr_scheduler_type': 'cosine', 'lr_scheduler_kwargs': None, 'warmup_ratio': 0.03, 'warmup_steps': 0, 'log_level': 'passive', 'log_level_replica': 'warning', 'log_on_each_node': True, 'logging_dir': '/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/out/qwen3asr_dapo_reward56_4x4x12_12gen_4GPU/v4-20260417-125332/runs', 'logging_strategy': 'steps', 'logging_first_step': True, 'logging_steps': 5, 'logging_nan_inf_filter': True, 'save_strategy': 'steps', 'save_steps': 20, 'save_total_limit': 
None, 'save_safetensors': True, 'save_on_each_node': False, 'save_only_model': False, 'restore_callback_states_from_checkpoint': False, 'no_cuda': False, 'use_cpu': False, 'use_mps_device': False, 'seed': 42, 'data_seed': 42, 'jit_mode_eval': False, 'bf16': True, 'fp16': False, 'fp16_opt_level': 'O1', 'half_precision_backend': 'auto', 'bf16_full_eval': False, 'fp16_full_eval': False, 'tf32': None, 'local_rank': 0, 'ddp_backend': None, 'tpu_num_cores': None, 'tpu_metrics_debug': False, 'debug': [], 'dataloader_drop_last': True, 'eval_steps': 20, 'dataloader_num_workers': 1, 'dataloader_prefetch_factor': 2, 'past_index': -1, 'run_name': 'qwen3asr_dapo_reward56_4x4x12_12gen_4GPU', 'disable_tqdm': False, 'remove_unused_columns': False, 'label_names': None, 'load_best_model_at_end': False, 'metric_for_best_model': 'loss', 'greater_is_better': False, 'ignore_data_skip': False, 'fsdp': [], 'fsdp_min_num_params': 0, 'fsdp_config': {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}, 'fsdp_transformer_layer_cls_to_wrap': None, 'accelerator_config': {'split_batches': False, 'dispatch_batches': False, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None}, 'parallelism_config': None, 'deepspeed': None, 'label_smoothing_factor': 0.0, 'optim': 'adamw_torch', 'optim_args': None, 'adafactor': False, 'group_by_length': False, 'length_column_name': 'length', 'report_to': ['wandb'], 'project': 'huggingface', 'trackio_space_id': 'trackio', 'ddp_find_unused_parameters': None, 'ddp_bucket_cap_mb': None, 'ddp_broadcast_buffers': None, 'dataloader_pin_memory': True, 'dataloader_persistent_workers': False, 'skip_memory_metrics': True, 'use_legacy_prediction_loop': False, 'push_to_hub': False, 'resume_from_checkpoint': None, 'hub_model_id': None, 'hub_strategy': 'every_save', 'hub_token': '<HUB_TOKEN>', 'hub_private_repo': None, 'hub_always_push': False, 'hub_revision': None, 
'gradient_checkpointing': False, 'gradient_checkpointing_kwargs': None, 'include_inputs_for_metrics': False, 'include_for_metrics': [], 'eval_do_concat_batches': True, 'fp16_backend': 'auto', 'push_to_hub_model_id': None, 'push_to_hub_organization': None, 'push_to_hub_token': '<PUSH_TO_HUB_TOKEN>', 'mp_parameters': '', 'auto_find_batch_size': False, 'full_determinism': False, 'torchdynamo': None, 'ray_scope': 'last', 'ddp_timeout': 18000000, 'torch_compile': False, 'torch_compile_backend': None, 'torch_compile_mode': None, 'include_tokens_per_second': False, 'include_num_input_tokens_seen': 'no', 'neftune_noise_alpha': None, 'optim_target_modules': None, 'batch_eval_metrics': False, 'eval_on_start': False, 'use_liger_kernel': False, 'liger_kernel_config': None, 'eval_use_gather_object': False, 'average_tokens_across_devices': True, 'model_init_kwargs': None, 'disable_dropout': False, 'cast_lm_head_to_fp32': False, 'num_generations': 12, 'num_generations_eval': 4, 'max_completion_length': 256, 'ds3_gather_for_generation': True, 'shuffle_dataset': True, 'generation_batch_size': 48, 'steps_per_generation': 3, 'min_p': None, 'generation_kwargs': None, 'chat_template_kwargs': None, 'use_transformers_paged': False, 'cache_implementation': None, 'use_vllm': False, 'vllm_mode': None, 'vllm_model_impl': 'vllm', 'vllm_enable_sleep_mode': False, 'vllm_structured_outputs_regex': None, 'vllm_server_base_url': None, 'vllm_server_host': None, 'vllm_server_port': [8000], 'vllm_server_timeout': 240.0, 'vllm_group_port': 51216, 'vllm_gpu_memory_utilization': 0.9, 'vllm_max_model_length': None, 'vllm_tensor_parallel_size': 1, 'beta': 0.04, 'num_iterations': 2, 'epsilon': 0.2, 'delta': None, 'epsilon_high': 0.28, 'sapo_temperature_neg': 1.05, 'sapo_temperature_pos': 1.0, 'importance_sampling_level': 'token', 'reward_weights': None, 'multi_objective_aggregation': 'sum_then_normalize', 'scale_rewards': 'group', 'loss_type': 'dapo', 'mask_truncated_completions': False, 'sync_ref_model': 
False, 'ref_model_mixup_alpha': 0.6, 'ref_model_sync_steps': 512, 'top_entropy_quantile': 1.0, 'max_tool_calling_iterations': None, 'vllm_importance_sampling_correction': True, 'vllm_importance_sampling_mode': 'sequence_mask', 'vllm_importance_sampling_cap': 3.0, 'off_policy_mask_threshold': None, 'use_bias_correction_kl': False, 'log_completions': True, 'num_completions_to_print': None, 'log_unique_prompts': False, 'log_completions_hub_repo': None, 'tuner_backend': 'peft', 'vit_gradient_checkpointing': True, 'router_aux_loss_coef': 0.0, 'enable_dft_loss': False, 'enable_channel_loss': False, 'safe_serialization': True, 'max_shard_size': '5GB', 'check_model': True, 'acc_strategy': 'token', 'train_dataloader_shuffle': True, 'max_epochs': None, 'aligner_lr': None, 'vit_lr': None, 'use_logits_to_keep': None, 'resume_only_model': False, 'optimizer': None, 'eval_metric': None, 'callbacks': [], 'early_stop_interval': None, 'eval_use_evalscope': False, 'eval_dataset': [], 'eval_dataset_args': None, 'eval_limit': None, 'eval_generation_config': None, 'extra_eval_args': None, 'tuner_type': 'lora', 'use_galore': False, 'galore_target_modules': None, 'galore_rank': 128, 'galore_update_proj_gap': 50, 'galore_scale': 1.0, 'galore_proj_type': 'std', 'galore_optim_per_parameter': False, 'galore_with_embedding': False, 'galore_quantization': False, 'galore_proj_quant': False, 'galore_proj_bits': 4, 'galore_proj_group_size': 256, 'galore_cos_threshold': 0.4, 'galore_gamma_proj': 2, 'galore_queue_size': 5, 'lisa_activated_layers': 0, 'lisa_step_interval': 20, 'use_flash_ckpt': False, 'vllm_pipeline_parallel_size': 1, 'vllm_enable_expert_parallel': False, 'vllm_max_num_seqs': None, 'vllm_max_model_len': None, 'vllm_disable_custom_all_reduce': True, 'vllm_enforce_eager': False, 'vllm_limit_mm_per_prompt': None, 'vllm_max_lora_rank': 16, 'vllm_enable_prefix_caching': True, 'vllm_use_async_engine': None, 'vllm_quantization': None, 'vllm_reasoning_parser': None, 
'vllm_disable_cascade_attn': False, 'vllm_mm_processor_cache_gb': None, 'vllm_speculative_config': None, 'vllm_engine_kwargs': {}, 'vllm_data_parallel_size': 1, 'stop_words': [], 'vllm_enable_lora': False, 'lora_rank': 8, 'vllm_server_group_port': None, 'enable_flattened_weight_sync': True, 'async_generate': False, 'structured_outputs_regex': None, 'sleep_level': 0, 'move_model_batches': None, 'offload_optimizer': False, 'offload_model': False, 'wandb_log_unique_prompts': None, 'cosine_min_len_value_wrong': -0.5, 'cosine_max_len_value_wrong': 0.0, 'cosine_min_len_value_correct': 1.0, 'cosine_max_len_value_correct': 0.5, 'cosine_max_len': 256, 'repetition_n_grams': 3, 'repetition_max_penalty': -1.0, 'reward_model': None, 'reward_model_plugin': None, 'chord_sft_dataset': [], 'chord_sft_per_device_train_batch_size': None, 'chord_enable_phi_function': False, 'chord_mu_warmup_steps': None, 'chord_mu_decay_steps': None, 'chord_mu_peak': None, 'chord_mu_valley': None, 'multi_turn_scheduler': None, 'max_turns': None, 'completion_length_limit_scope': 'per_round', 'vllm_server_pass_dataset': False, 'dynamic_sample': True, 'max_resample_times': 4, 'overlong_filter': True, 'soft_max_length': None, 'soft_cache_length': None, 'log_entropy': False, 'tau_pos': 1.0, 'tau_neg': 1.05, 'advantage_estimator': 'grpo', 'kl_in_reward': False, 'dataset_shuffle': True, 'rollout_importance_sampling_mode': None, 'rollout_importance_sampling_threshold': 2.0, 'log_rollout_offpolicy_metrics': False, 'off_policy_sequence_mask_delta': None}
|
| 23 |
+
2026-04-17 12:53:51,543 INFO MainThread:255159 [wandb_config.py:__setitem__():154] [no run ID] config set model/num_parameters = 2050307712 - <bound method Run._config_callback of <wandb.sdk.wandb_run.Run object at 0x7fca74e06a70>>
|
| 24 |
+
2026-04-17 12:53:51,543 INFO MainThread:255159 [wandb_run.py:_config_callback():1385] config_cb model/num_parameters 2050307712 None
|
| 25 |
+
2026-04-17 13:03:10,120 INFO wandb-AsyncioManager-main:255159 [service_client.py:_forward_responses():80] Reached EOF.
|
| 26 |
+
2026-04-17 13:03:10,120 INFO wandb-AsyncioManager-main:255159 [mailbox.py:close():137] Closing mailbox, abandoning 1 handles.
|
wandb/run-20260418_172847-c2a5hfz3/files/config.yaml
ADDED
|
@@ -0,0 +1,1262 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
_name_or_path:
|
| 2 |
+
value: /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/qwen3-asr-merged
|
| 3 |
+
_wandb:
|
| 4 |
+
value:
|
| 5 |
+
cli_version: 0.23.0
|
| 6 |
+
e:
|
| 7 |
+
ess1zs9oqcfvbaak4xbqvnst142xqp1g:
|
| 8 |
+
args:
|
| 9 |
+
- --rlhf_type
|
| 10 |
+
- grpo
|
| 11 |
+
- --external_plugins
|
| 12 |
+
- /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/my_qwen3_asr_dapo_register.py
|
| 13 |
+
- /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/0417_reward.py
|
| 14 |
+
- --model
|
| 15 |
+
- /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/qwen3-asr-merged
|
| 16 |
+
- --model_type
|
| 17 |
+
- my_qwen3_asr_rl
|
| 18 |
+
- --template
|
| 19 |
+
- my_qwen3_asr_rl
|
| 20 |
+
- --dataset
|
| 21 |
+
- /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/lora_0323_10w+55w+error+syn_with_domain_train90_targeted_rl_train90_loramerged_basewer_3suppress_server.jsonl
|
| 22 |
+
- --val_dataset
|
| 23 |
+
- /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/lora_0323_10w+55w+error+syn_with_domain_train90_targeted_rl_val5_sample5p_server.jsonl
|
| 24 |
+
- --reward_funcs
|
| 25 |
+
- asr_wer_sub_len_cmp_hallu_dirty_v56
|
| 26 |
+
- --train_type
|
| 27 |
+
- lora
|
| 28 |
+
- --use_vllm
|
| 29 |
+
- "false"
|
| 30 |
+
- --log_completions
|
| 31 |
+
- "true"
|
| 32 |
+
- --loss_type
|
| 33 |
+
- dapo
|
| 34 |
+
- --advantage_estimator
|
| 35 |
+
- grpo
|
| 36 |
+
- --scale_rewards
|
| 37 |
+
- group
|
| 38 |
+
- --num_iterations
|
| 39 |
+
- "2"
|
| 40 |
+
- --beta
|
| 41 |
+
- "0.04"
|
| 42 |
+
- --epsilon_high
|
| 43 |
+
- "0.28"
|
| 44 |
+
- --dynamic_sample
|
| 45 |
+
- "true"
|
| 46 |
+
- --max_resample_times
|
| 47 |
+
- "4"
|
| 48 |
+
- --overlong_filter
|
| 49 |
+
- "true"
|
| 50 |
+
- --truncation_strategy
|
| 51 |
+
- delete
|
| 52 |
+
- --num_generations
|
| 53 |
+
- "12"
|
| 54 |
+
- --generation_batch_size
|
| 55 |
+
- "48"
|
| 56 |
+
- --per_device_train_batch_size
|
| 57 |
+
- "4"
|
| 58 |
+
- --per_device_eval_batch_size
|
| 59 |
+
- "4"
|
| 60 |
+
- --gradient_accumulation_steps
|
| 61 |
+
- "12"
|
| 62 |
+
- --num_generations_eval
|
| 63 |
+
- "4"
|
| 64 |
+
- --max_completion_length
|
| 65 |
+
- "256"
|
| 66 |
+
- --temperature
|
| 67 |
+
- "0.50"
|
| 68 |
+
- --top_p
|
| 69 |
+
- "0.95"
|
| 70 |
+
- --top_k
|
| 71 |
+
- "50"
|
| 72 |
+
- --repetition_penalty
|
| 73 |
+
- "1.08"
|
| 74 |
+
- --learning_rate
|
| 75 |
+
- "5e-5"
|
| 76 |
+
- --lr_scheduler_type
|
| 77 |
+
- cosine
|
| 78 |
+
- --warmup_ratio
|
| 79 |
+
- "0.03"
|
| 80 |
+
- --report_to
|
| 81 |
+
- wandb
|
| 82 |
+
- --run_name
|
| 83 |
+
- qwen3asr_dapo_reward56_4x4x12_12gen_4GPU
|
| 84 |
+
- --output_dir
|
| 85 |
+
- /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/out/qwen3asr_dapo_reward56_4x4x12_12gen_4GPU
|
| 86 |
+
- --save_strategy
|
| 87 |
+
- steps
|
| 88 |
+
- --save_steps
|
| 89 |
+
- "20"
|
| 90 |
+
- --logging_steps
|
| 91 |
+
- "5"
|
| 92 |
+
- --freeze_llm
|
| 93 |
+
- "false"
|
| 94 |
+
- --freeze_vit
|
| 95 |
+
- "false"
|
| 96 |
+
- --freeze_aligner
|
| 97 |
+
- "false"
|
| 98 |
+
- --remove_unused_columns
|
| 99 |
+
- "false"
|
| 100 |
+
- --padding_side
|
| 101 |
+
- left
|
| 102 |
+
cpu_count: 64
|
| 103 |
+
cpu_count_logical: 128
|
| 104 |
+
cudaVersion: "12.4"
|
| 105 |
+
disk:
|
| 106 |
+
/:
|
| 107 |
+
total: "524945911808"
|
| 108 |
+
used: "37368901632"
|
| 109 |
+
email: pang_kaiyu@163.com
|
| 110 |
+
executable: /mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/bin/python3.10
|
| 111 |
+
gpu: NVIDIA A100-SXM4-80GB
|
| 112 |
+
gpu_count: 8
|
| 113 |
+
gpu_nvidia:
|
| 114 |
+
- architecture: Ampere
|
| 115 |
+
cudaCores: 6912
|
| 116 |
+
memoryTotal: "85899345920"
|
| 117 |
+
name: NVIDIA A100-SXM4-80GB
|
| 118 |
+
uuid: GPU-87e7e3ab-b254-fc22-7407-8e2e88e9d854
|
| 119 |
+
- architecture: Ampere
|
| 120 |
+
cudaCores: 6912
|
| 121 |
+
memoryTotal: "85899345920"
|
| 122 |
+
name: NVIDIA A100-SXM4-80GB
|
| 123 |
+
uuid: GPU-976db8a1-cf00-11c6-caaa-413862233fd4
|
| 124 |
+
- architecture: Ampere
|
| 125 |
+
cudaCores: 6912
|
| 126 |
+
memoryTotal: "85899345920"
|
| 127 |
+
name: NVIDIA A100-SXM4-80GB
|
| 128 |
+
uuid: GPU-78b37ae8-44e0-e318-a6c0-f6f4ac78d46a
|
| 129 |
+
- architecture: Ampere
|
| 130 |
+
cudaCores: 6912
|
| 131 |
+
memoryTotal: "85899345920"
|
| 132 |
+
name: NVIDIA A100-SXM4-80GB
|
| 133 |
+
uuid: GPU-840b937d-a7d4-68e7-ad57-f4568e01c3ae
|
| 134 |
+
- architecture: Ampere
|
| 135 |
+
cudaCores: 6912
|
| 136 |
+
memoryTotal: "85899345920"
|
| 137 |
+
name: NVIDIA A100-SXM4-80GB
|
| 138 |
+
uuid: GPU-a9d0de54-f5b5-f83b-7bda-f53db844622d
|
| 139 |
+
- architecture: Ampere
|
| 140 |
+
cudaCores: 6912
|
| 141 |
+
memoryTotal: "85899345920"
|
| 142 |
+
name: NVIDIA A100-SXM4-80GB
|
| 143 |
+
uuid: GPU-cb7d22e9-305c-c68c-64f1-599580742db0
|
| 144 |
+
- architecture: Ampere
|
| 145 |
+
cudaCores: 6912
|
| 146 |
+
memoryTotal: "85899345920"
|
| 147 |
+
name: NVIDIA A100-SXM4-80GB
|
| 148 |
+
uuid: GPU-8d9704bb-4592-346f-a7f2-1a6ed8d58619
|
| 149 |
+
- architecture: Ampere
|
| 150 |
+
cudaCores: 6912
|
| 151 |
+
memoryTotal: "85899345920"
|
| 152 |
+
name: NVIDIA A100-SXM4-80GB
|
| 153 |
+
uuid: GPU-3892f01b-e0b8-a9d9-0587-b5a7d2d9b5ab
|
| 154 |
+
host: SH-IDC1-10-140-37-95
|
| 155 |
+
memory:
|
| 156 |
+
total: "1081627828224"
|
| 157 |
+
os: Linux-3.10.0-957.el7.x86_64-x86_64-with-glibc2.17
|
| 158 |
+
program: /mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/cli/rlhf.py
|
| 159 |
+
python: CPython 3.10.18
|
| 160 |
+
root: /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload
|
| 161 |
+
slurm:
|
| 162 |
+
cluster_name: cluster_sproject3
|
| 163 |
+
conf: /etc/slurm/slurm.conf
|
| 164 |
+
cpus_on_node: "2"
|
| 165 |
+
gtids: "0"
|
| 166 |
+
job_account: research
|
| 167 |
+
job_cpus_per_node: "2"
|
| 168 |
+
job_gid: "800000689"
|
| 169 |
+
job_gpus: 0,1,2,6
|
| 170 |
+
job_id: "8574598"
|
| 171 |
+
job_name: qwen3_asr_train_4gpu
|
| 172 |
+
job_nodelist: SH-IDC1-10-140-37-95
|
| 173 |
+
job_num_nodes: "1"
|
| 174 |
+
job_partition: interntmp
|
| 175 |
+
job_qos: normal
|
| 176 |
+
job_uid: "800000689"
|
| 177 |
+
job_user: panjiabao
|
| 178 |
+
jobid: "8574598"
|
| 179 |
+
localid: "0"
|
| 180 |
+
nnodes: "1"
|
| 181 |
+
node_aliases: (null)
|
| 182 |
+
nodeid: "0"
|
| 183 |
+
nodelist: SH-IDC1-10-140-37-95
|
| 184 |
+
nprocs: "1"
|
| 185 |
+
ntasks: "1"
|
| 186 |
+
prio_process: "0"
|
| 187 |
+
procid: "0"
|
| 188 |
+
submit_dir: /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload
|
| 189 |
+
submit_host: SH-IDC1-10-140-37-164
|
| 190 |
+
task_pid: "9466"
|
| 191 |
+
tasks_per_node: "1"
|
| 192 |
+
topology_addr: SH-IDC1-10-140-37-95
|
| 193 |
+
topology_addr_pattern: node
|
| 194 |
+
working_cluster: cluster_sproject3:SH-IDC1-10-140-37-161:6817:9216:109
|
| 195 |
+
startedAt: "2026-04-18T09:28:47.432340Z"
|
| 196 |
+
writerId: ess1zs9oqcfvbaak4xbqvnst142xqp1g
|
| 197 |
+
m:
|
| 198 |
+
- "1": train/global_step
|
| 199 |
+
"6":
|
| 200 |
+
- 3
|
| 201 |
+
"7": []
|
| 202 |
+
- "2": '*'
|
| 203 |
+
"5": 1
|
| 204 |
+
"6":
|
| 205 |
+
- 1
|
| 206 |
+
"7": []
|
| 207 |
+
python_version: 3.10.18
|
| 208 |
+
t:
|
| 209 |
+
"1":
|
| 210 |
+
- 1
|
| 211 |
+
- 5
|
| 212 |
+
- 11
|
| 213 |
+
- 30
|
| 214 |
+
- 41
|
| 215 |
+
- 49
|
| 216 |
+
- 51
|
| 217 |
+
- 53
|
| 218 |
+
- 71
|
| 219 |
+
- 84
|
| 220 |
+
- 95
|
| 221 |
+
- 98
|
| 222 |
+
- 105
|
| 223 |
+
"2":
|
| 224 |
+
- 1
|
| 225 |
+
- 5
|
| 226 |
+
- 11
|
| 227 |
+
- 30
|
| 228 |
+
- 41
|
| 229 |
+
- 49
|
| 230 |
+
- 51
|
| 231 |
+
- 53
|
| 232 |
+
- 71
|
| 233 |
+
- 84
|
| 234 |
+
- 95
|
| 235 |
+
- 98
|
| 236 |
+
- 105
|
| 237 |
+
"3":
|
| 238 |
+
- 7
|
| 239 |
+
- 13
|
| 240 |
+
- 19
|
| 241 |
+
- 66
|
| 242 |
+
"4": 3.10.18
|
| 243 |
+
"5": 0.23.0
|
| 244 |
+
"6": 4.57.6
|
| 245 |
+
"9":
|
| 246 |
+
"1": transformers_trainer
|
| 247 |
+
"12": 0.23.0
|
| 248 |
+
"13": linux-x86_64
|
| 249 |
+
acc_strategy:
|
| 250 |
+
value: token
|
| 251 |
+
accelerator_config:
|
| 252 |
+
value:
|
| 253 |
+
dispatch_batches: false
|
| 254 |
+
even_batches: true
|
| 255 |
+
gradient_accumulation_kwargs: null
|
| 256 |
+
non_blocking: false
|
| 257 |
+
split_batches: false
|
| 258 |
+
use_seedable_sampler: true
|
| 259 |
+
adafactor:
|
| 260 |
+
value: false
|
| 261 |
+
adam_beta1:
|
| 262 |
+
value: 0.9
|
| 263 |
+
adam_beta2:
|
| 264 |
+
value: 0.95
|
| 265 |
+
adam_epsilon:
|
| 266 |
+
value: 1e-08
|
| 267 |
+
add_cross_attention:
|
| 268 |
+
value: false
|
| 269 |
+
advantage_estimator:
|
| 270 |
+
value: grpo
|
| 271 |
+
aligner_lr:
|
| 272 |
+
value: null
|
| 273 |
+
architectures:
|
| 274 |
+
value:
|
| 275 |
+
- Qwen3ASRForConditionalGeneration
|
| 276 |
+
async_generate:
|
| 277 |
+
value: false
|
| 278 |
+
auto_find_batch_size:
|
| 279 |
+
value: false
|
| 280 |
+
average_tokens_across_devices:
|
| 281 |
+
value: true
|
| 282 |
+
bad_words_ids:
|
| 283 |
+
value: null
|
| 284 |
+
batch_eval_metrics:
|
| 285 |
+
value: false
|
| 286 |
+
begin_suppress_tokens:
|
| 287 |
+
value: null
|
| 288 |
+
beta:
|
| 289 |
+
value: 0.04
|
| 290 |
+
bf16:
|
| 291 |
+
value: true
|
| 292 |
+
bf16_full_eval:
|
| 293 |
+
value: false
|
| 294 |
+
bos_token_id:
|
| 295 |
+
value: null
|
| 296 |
+
cache_implementation:
|
| 297 |
+
value: null
|
| 298 |
+
callbacks:
|
| 299 |
+
value: []
|
| 300 |
+
cast_lm_head_to_fp32:
|
| 301 |
+
value: false
|
| 302 |
+
chat_template_kwargs:
|
| 303 |
+
value: null
|
| 304 |
+
check_model:
|
| 305 |
+
value: true
|
| 306 |
+
chord_enable_phi_function:
|
| 307 |
+
value: false
|
| 308 |
+
chord_mu_decay_steps:
|
| 309 |
+
value: null
|
| 310 |
+
chord_mu_peak:
|
| 311 |
+
value: null
|
| 312 |
+
chord_mu_valley:
|
| 313 |
+
value: null
|
| 314 |
+
chord_mu_warmup_steps:
|
| 315 |
+
value: null
|
| 316 |
+
chord_sft_dataset:
|
| 317 |
+
value: []
|
| 318 |
+
chord_sft_per_device_train_batch_size:
|
| 319 |
+
value: null
|
| 320 |
+
chunk_size_feed_forward:
|
| 321 |
+
value: 0
|
| 322 |
+
completion_length_limit_scope:
|
| 323 |
+
value: per_round
|
| 324 |
+
cosine_max_len:
|
| 325 |
+
value: 256
|
| 326 |
+
cosine_max_len_value_correct:
|
| 327 |
+
value: 0.5
|
| 328 |
+
cosine_max_len_value_wrong:
|
| 329 |
+
value: 0
|
| 330 |
+
cosine_min_len_value_correct:
|
| 331 |
+
value: 1
|
| 332 |
+
cosine_min_len_value_wrong:
|
| 333 |
+
value: -0.5
|
| 334 |
+
cross_attention_hidden_size:
|
| 335 |
+
value: null
|
| 336 |
+
data_seed:
|
| 337 |
+
value: 42
|
| 338 |
+
dataloader_drop_last:
|
| 339 |
+
value: true
|
| 340 |
+
dataloader_num_workers:
|
| 341 |
+
value: 1
|
| 342 |
+
dataloader_persistent_workers:
|
| 343 |
+
value: false
|
| 344 |
+
dataloader_pin_memory:
|
| 345 |
+
value: true
|
| 346 |
+
dataloader_prefetch_factor:
|
| 347 |
+
value: 2
|
| 348 |
+
dataset_shuffle:
|
| 349 |
+
value: true
|
| 350 |
+
ddp_backend:
|
| 351 |
+
value: null
|
| 352 |
+
ddp_broadcast_buffers:
|
| 353 |
+
value: null
|
| 354 |
+
ddp_bucket_cap_mb:
|
| 355 |
+
value: null
|
| 356 |
+
ddp_find_unused_parameters:
|
| 357 |
+
value: null
|
| 358 |
+
ddp_timeout:
|
| 359 |
+
value: 18000000
|
| 360 |
+
debug:
|
| 361 |
+
value: []
|
| 362 |
+
decoder_start_token_id:
|
| 363 |
+
value: null
|
| 364 |
+
deepspeed:
|
| 365 |
+
value: null
|
| 366 |
+
delta:
|
| 367 |
+
value: null
|
| 368 |
+
disable_dropout:
|
| 369 |
+
value: false
|
| 370 |
+
disable_tqdm:
|
| 371 |
+
value: false
|
| 372 |
+
diversity_penalty:
|
| 373 |
+
value: 0
|
| 374 |
+
do_eval:
|
| 375 |
+
value: true
|
| 376 |
+
do_predict:
|
| 377 |
+
value: false
|
| 378 |
+
do_sample:
|
| 379 |
+
value: false
|
| 380 |
+
do_train:
|
| 381 |
+
value: false
|
| 382 |
+
ds3_gather_for_generation:
|
| 383 |
+
value: true
|
| 384 |
+
dtype:
|
| 385 |
+
value: bfloat16
|
| 386 |
+
dynamic_sample:
|
| 387 |
+
value: true
|
| 388 |
+
early_stop_interval:
|
| 389 |
+
value: null
|
| 390 |
+
early_stopping:
|
| 391 |
+
value: false
|
| 392 |
+
enable_channel_loss:
|
| 393 |
+
value: false
|
| 394 |
+
enable_dft_loss:
|
| 395 |
+
value: false
|
| 396 |
+
enable_flattened_weight_sync:
|
| 397 |
+
value: true
|
| 398 |
+
encoder_no_repeat_ngram_size:
|
| 399 |
+
value: 0
|
| 400 |
+
eos_token_id:
|
| 401 |
+
value: 151645
|
| 402 |
+
epsilon:
|
| 403 |
+
value: 0.2
|
| 404 |
+
epsilon_high:
|
| 405 |
+
value: 0.28
|
| 406 |
+
eval_accumulation_steps:
|
| 407 |
+
value: null
|
| 408 |
+
eval_dataset:
|
| 409 |
+
value: []
|
| 410 |
+
eval_dataset_args:
|
| 411 |
+
value: null
|
| 412 |
+
eval_delay:
|
| 413 |
+
value: 0
|
| 414 |
+
eval_do_concat_batches:
|
| 415 |
+
value: true
|
| 416 |
+
eval_generation_config:
|
| 417 |
+
value: null
|
| 418 |
+
eval_limit:
|
| 419 |
+
value: null
|
| 420 |
+
eval_metric:
|
| 421 |
+
value: null
|
| 422 |
+
eval_on_start:
|
| 423 |
+
value: false
|
| 424 |
+
eval_steps:
|
| 425 |
+
value: 20
|
| 426 |
+
eval_strategy:
|
| 427 |
+
value: steps
|
| 428 |
+
eval_use_evalscope:
|
| 429 |
+
value: false
|
| 430 |
+
eval_use_gather_object:
|
| 431 |
+
value: false
|
| 432 |
+
exponential_decay_length_penalty:
|
| 433 |
+
value: null
|
| 434 |
+
extra_eval_args:
|
| 435 |
+
value: null
|
| 436 |
+
finetuning_task:
|
| 437 |
+
value: null
|
| 438 |
+
forced_bos_token_id:
|
| 439 |
+
value: null
|
| 440 |
+
forced_eos_token_id:
|
| 441 |
+
value: null
|
| 442 |
+
fp16:
|
| 443 |
+
value: false
|
| 444 |
+
fp16_backend:
|
| 445 |
+
value: auto
|
| 446 |
+
fp16_full_eval:
|
| 447 |
+
value: false
|
| 448 |
+
fp16_opt_level:
|
| 449 |
+
value: O1
|
| 450 |
+
fsdp:
|
| 451 |
+
value: []
|
| 452 |
+
fsdp_config:
|
| 453 |
+
value:
|
| 454 |
+
min_num_params: 0
|
| 455 |
+
xla: false
|
| 456 |
+
xla_fsdp_grad_ckpt: false
|
| 457 |
+
xla_fsdp_v2: false
|
| 458 |
+
fsdp_min_num_params:
|
| 459 |
+
value: 0
|
| 460 |
+
fsdp_transformer_layer_cls_to_wrap:
|
| 461 |
+
value: null
|
| 462 |
+
full_determinism:
|
| 463 |
+
value: false
|
| 464 |
+
galore_cos_threshold:
|
| 465 |
+
value: 0.4
|
| 466 |
+
galore_gamma_proj:
|
| 467 |
+
value: 2
|
| 468 |
+
galore_optim_per_parameter:
|
| 469 |
+
value: false
|
| 470 |
+
galore_proj_bits:
|
| 471 |
+
value: 4
|
| 472 |
+
galore_proj_group_size:
|
| 473 |
+
value: 256
|
| 474 |
+
galore_proj_quant:
|
| 475 |
+
value: false
|
| 476 |
+
galore_proj_type:
|
| 477 |
+
value: std
|
| 478 |
+
galore_quantization:
|
| 479 |
+
value: false
|
| 480 |
+
galore_queue_size:
|
| 481 |
+
value: 5
|
| 482 |
+
galore_rank:
|
| 483 |
+
value: 128
|
| 484 |
+
galore_scale:
|
| 485 |
+
value: 1
|
| 486 |
+
galore_target_modules:
|
| 487 |
+
value: null
|
| 488 |
+
galore_update_proj_gap:
|
| 489 |
+
value: 50
|
| 490 |
+
galore_with_embedding:
|
| 491 |
+
value: false
|
| 492 |
+
generation_batch_size:
|
| 493 |
+
value: 48
|
| 494 |
+
generation_kwargs:
|
| 495 |
+
value: null
|
| 496 |
+
gradient_accumulation_steps:
|
| 497 |
+
value: 12
|
| 498 |
+
gradient_checkpointing:
|
| 499 |
+
value: false
|
| 500 |
+
gradient_checkpointing_kwargs:
|
| 501 |
+
value: null
|
| 502 |
+
greater_is_better:
|
| 503 |
+
value: false
|
| 504 |
+
group_by_length:
|
| 505 |
+
value: false
|
| 506 |
+
half_precision_backend:
|
| 507 |
+
value: auto
|
| 508 |
+
hub_always_push:
|
| 509 |
+
value: false
|
| 510 |
+
hub_model_id:
|
| 511 |
+
value: null
|
| 512 |
+
hub_private_repo:
|
| 513 |
+
value: null
|
| 514 |
+
hub_revision:
|
| 515 |
+
value: null
|
| 516 |
+
hub_strategy:
|
| 517 |
+
value: every_save
|
| 518 |
+
hub_token:
|
| 519 |
+
value: <HUB_TOKEN>
|
| 520 |
+
id2label:
|
| 521 |
+
value:
|
| 522 |
+
"0": LABEL_0
|
| 523 |
+
"1": LABEL_1
|
| 524 |
+
ignore_data_skip:
|
| 525 |
+
value: false
|
| 526 |
+
importance_sampling_level:
|
| 527 |
+
value: token
|
| 528 |
+
include_for_metrics:
|
| 529 |
+
value: []
|
| 530 |
+
include_inputs_for_metrics:
|
| 531 |
+
value: false
|
| 532 |
+
include_num_input_tokens_seen:
|
| 533 |
+
value: "no"
|
| 534 |
+
include_tokens_per_second:
|
| 535 |
+
value: false
|
| 536 |
+
is_decoder:
|
| 537 |
+
value: false
|
| 538 |
+
is_encoder_decoder:
|
| 539 |
+
value: false
|
| 540 |
+
jit_mode_eval:
|
| 541 |
+
value: false
|
| 542 |
+
kl_in_reward:
|
| 543 |
+
value: false
|
| 544 |
+
label_names:
|
| 545 |
+
value: null
|
| 546 |
+
label_smoothing_factor:
|
| 547 |
+
value: 0
|
| 548 |
+
label2id:
|
| 549 |
+
value:
|
| 550 |
+
LABEL_0: 0
|
| 551 |
+
LABEL_1: 1
|
| 552 |
+
learning_rate:
|
| 553 |
+
value: 5e-05
|
| 554 |
+
length_column_name:
|
| 555 |
+
value: length
|
| 556 |
+
length_penalty:
|
| 557 |
+
value: 1
|
| 558 |
+
liger_kernel_config:
|
| 559 |
+
value: null
|
| 560 |
+
lisa_activated_layers:
|
| 561 |
+
value: 0
|
| 562 |
+
lisa_step_interval:
|
| 563 |
+
value: 20
|
| 564 |
+
load_best_model_at_end:
|
| 565 |
+
value: false
|
| 566 |
+
local_rank:
|
| 567 |
+
value: 0
|
| 568 |
+
log_completions:
|
| 569 |
+
value: true
|
| 570 |
+
log_completions_hub_repo:
|
| 571 |
+
value: null
|
| 572 |
+
log_entropy:
|
| 573 |
+
value: false
|
| 574 |
+
log_level:
|
| 575 |
+
value: passive
|
| 576 |
+
log_level_replica:
|
| 577 |
+
value: warning
|
| 578 |
+
log_on_each_node:
|
| 579 |
+
value: true
|
| 580 |
+
log_rollout_offpolicy_metrics:
|
| 581 |
+
value: false
|
| 582 |
+
log_unique_prompts:
|
| 583 |
+
value: false
|
| 584 |
+
logging_dir:
|
| 585 |
+
value: /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/out/qwen3asr_dapo_reward56_4x4x12_12gen_4GPU/v5-20260418-172837/runs
|
| 586 |
+
logging_first_step:
|
| 587 |
+
value: true
|
| 588 |
+
logging_nan_inf_filter:
|
| 589 |
+
value: true
|
| 590 |
+
logging_steps:
|
| 591 |
+
value: 5
|
| 592 |
+
logging_strategy:
|
| 593 |
+
value: steps
|
| 594 |
+
lora_rank:
|
| 595 |
+
value: 8
|
| 596 |
+
loss_type:
|
| 597 |
+
value: dapo
|
| 598 |
+
lr_scheduler_kwargs:
|
| 599 |
+
value: null
|
| 600 |
+
lr_scheduler_type:
|
| 601 |
+
value: cosine
|
| 602 |
+
mask_truncated_completions:
|
| 603 |
+
value: false
|
| 604 |
+
max_completion_length:
|
| 605 |
+
value: 256
|
| 606 |
+
max_epochs:
|
| 607 |
+
value: null
|
| 608 |
+
max_grad_norm:
|
| 609 |
+
value: 1
|
| 610 |
+
max_length:
|
| 611 |
+
value: 20
|
| 612 |
+
max_resample_times:
|
| 613 |
+
value: 4
|
| 614 |
+
max_shard_size:
|
| 615 |
+
value: 5GB
|
| 616 |
+
max_steps:
|
| 617 |
+
value: -1
|
| 618 |
+
max_tool_calling_iterations:
|
| 619 |
+
value: null
|
| 620 |
+
max_turns:
|
| 621 |
+
value: null
|
| 622 |
+
metric_for_best_model:
|
| 623 |
+
value: loss
|
| 624 |
+
min_length:
|
| 625 |
+
value: 0
|
| 626 |
+
min_p:
|
| 627 |
+
value: null
|
| 628 |
+
model/num_parameters:
|
| 629 |
+
value: 2050307712
|
| 630 |
+
model_init_kwargs:
|
| 631 |
+
value: null
|
| 632 |
+
model_type:
|
| 633 |
+
value: qwen3_asr
|
| 634 |
+
move_model_batches:
|
| 635 |
+
value: null
|
| 636 |
+
mp_parameters:
|
| 637 |
+
value: ""
|
| 638 |
+
multi_objective_aggregation:
|
| 639 |
+
value: sum_then_normalize
|
| 640 |
+
multi_turn_scheduler:
|
| 641 |
+
value: null
|
| 642 |
+
neftune_noise_alpha:
|
| 643 |
+
value: null
|
| 644 |
+
no_cuda:
|
| 645 |
+
value: false
|
| 646 |
+
no_repeat_ngram_size:
|
| 647 |
+
value: 0
|
| 648 |
+
num_beam_groups:
|
| 649 |
+
value: 1
|
| 650 |
+
num_beams:
|
| 651 |
+
value: 1
|
| 652 |
+
num_completions_to_print:
|
| 653 |
+
value: null
|
| 654 |
+
num_generations:
|
| 655 |
+
value: 12
|
| 656 |
+
num_generations_eval:
|
| 657 |
+
value: 4
|
| 658 |
+
num_iterations:
|
| 659 |
+
value: 2
|
| 660 |
+
num_return_sequences:
|
| 661 |
+
value: 1
|
| 662 |
+
num_train_epochs:
|
| 663 |
+
value: 3
|
| 664 |
+
off_policy_mask_threshold:
|
| 665 |
+
value: null
|
| 666 |
+
off_policy_sequence_mask_delta:
|
| 667 |
+
value: null
|
| 668 |
+
offload_model:
|
| 669 |
+
value: false
|
| 670 |
+
offload_optimizer:
|
| 671 |
+
value: false
|
| 672 |
+
optim:
|
| 673 |
+
value: adamw_torch
|
| 674 |
+
optim_args:
|
| 675 |
+
value: null
|
| 676 |
+
optim_target_modules:
|
| 677 |
+
value: null
|
| 678 |
+
optimizer:
|
| 679 |
+
value: null
|
| 680 |
+
output_attentions:
|
| 681 |
+
value: false
|
| 682 |
+
output_dir:
|
| 683 |
+
value: /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/out/qwen3asr_dapo_reward56_4x4x12_12gen_4GPU/v5-20260418-172837
|
| 684 |
+
output_hidden_states:
|
| 685 |
+
value: false
|
| 686 |
+
output_scores:
|
| 687 |
+
value: false
|
| 688 |
+
overlong_filter:
|
| 689 |
+
value: true
|
| 690 |
+
overwrite_output_dir:
|
| 691 |
+
value: false
|
| 692 |
+
pad_token_id:
|
| 693 |
+
value: 151643
|
| 694 |
+
parallelism_config:
|
| 695 |
+
value: null
|
| 696 |
+
past_index:
|
| 697 |
+
value: -1
|
| 698 |
+
peft_config:
|
| 699 |
+
value:
|
| 700 |
+
default:
|
| 701 |
+
alora_invocation_tokens: null
|
| 702 |
+
arrow_config: null
|
| 703 |
+
auto_mapping: null
|
| 704 |
+
base_model_name_or_path: /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/qwen3-asr-merged
|
| 705 |
+
bias: none
|
| 706 |
+
corda_config: null
|
| 707 |
+
ensure_weight_tying: false
|
| 708 |
+
eva_config: null
|
| 709 |
+
exclude_modules: null
|
| 710 |
+
fan_in_fan_out: false
|
| 711 |
+
inference_mode: false
|
| 712 |
+
init_lora_weights: true
|
| 713 |
+
layer_replication: null
|
| 714 |
+
layers_pattern: null
|
| 715 |
+
layers_to_transform: null
|
| 716 |
+
lora_alpha: 32
|
| 717 |
+
lora_bias: false
|
| 718 |
+
lora_dropout: 0.05
|
| 719 |
+
lora_dtype: null
|
| 720 |
+
lorap_emb_lr: 1e-06
|
| 721 |
+
lorap_lr_ratio: null
|
| 722 |
+
megatron_config: null
|
| 723 |
+
megatron_core: megatron.core
|
| 724 |
+
modules_to_save: []
|
| 725 |
+
peft_type: LORA
|
| 726 |
+
peft_version: 0.18.1
|
| 727 |
+
qalora_group_size: 16
|
| 728 |
+
r: 8
|
| 729 |
+
revision: null
|
| 730 |
+
runtime_config:
|
| 731 |
+
ephemeral_gpu_offload: false
|
| 732 |
+
target_modules: ^(thinker\.model(?=\.).*\.(up_proj|q_proj|o_proj|gate_proj|k_proj|v_proj|down_proj)|thinker\.audio_tower\.layers(?=\.).*\.(q_proj|fc1|out_proj|k_proj|v_proj|fc2)|thinker\.audio_tower\.conv_out(?=\.)|thinker\.audio_tower\.proj1(?=\.)|thinker\.audio_tower\.proj2(?=\.))$
|
| 733 |
+
target_parameters: null
|
| 734 |
+
task_type: CAUSAL_LM
|
| 735 |
+
trainable_token_indices: null
|
| 736 |
+
use_dora: false
|
| 737 |
+
use_qalora: false
|
| 738 |
+
use_rslora: false
|
| 739 |
+
per_device_eval_batch_size:
|
| 740 |
+
value: 4
|
| 741 |
+
per_device_train_batch_size:
|
| 742 |
+
value: 4
|
| 743 |
+
per_gpu_eval_batch_size:
|
| 744 |
+
value: null
|
| 745 |
+
per_gpu_train_batch_size:
|
| 746 |
+
value: null
|
| 747 |
+
prediction_loss_only:
|
| 748 |
+
value: false
|
| 749 |
+
prefix:
|
| 750 |
+
value: null
|
| 751 |
+
problem_type:
|
| 752 |
+
value: null
|
| 753 |
+
project:
|
| 754 |
+
value: huggingface
|
| 755 |
+
push_to_hub:
|
| 756 |
+
value: false
|
| 757 |
+
push_to_hub_model_id:
|
| 758 |
+
value: null
|
| 759 |
+
push_to_hub_organization:
|
| 760 |
+
value: null
|
| 761 |
+
push_to_hub_token:
|
| 762 |
+
value: <PUSH_TO_HUB_TOKEN>
|
| 763 |
+
ray_scope:
|
| 764 |
+
value: last
|
| 765 |
+
ref_model_mixup_alpha:
|
| 766 |
+
value: 0.6
|
| 767 |
+
ref_model_sync_steps:
|
| 768 |
+
value: 512
|
| 769 |
+
remove_invalid_values:
|
| 770 |
+
value: false
|
| 771 |
+
remove_unused_columns:
|
| 772 |
+
value: false
|
| 773 |
+
repetition_max_penalty:
|
| 774 |
+
value: -1
|
| 775 |
+
repetition_n_grams:
|
| 776 |
+
value: 3
|
| 777 |
+
repetition_penalty:
|
| 778 |
+
value: 1.08
|
| 779 |
+
report_to:
|
| 780 |
+
value:
|
| 781 |
+
- wandb
|
| 782 |
+
restore_callback_states_from_checkpoint:
|
| 783 |
+
value: false
|
| 784 |
+
resume_from_checkpoint:
|
| 785 |
+
value: null
|
| 786 |
+
resume_only_model:
|
| 787 |
+
value: false
|
| 788 |
+
return_dict:
|
| 789 |
+
value: true
|
| 790 |
+
return_dict_in_generate:
|
| 791 |
+
value: false
|
| 792 |
+
reward_model:
|
| 793 |
+
value: null
|
| 794 |
+
reward_model_plugin:
|
| 795 |
+
value: null
|
| 796 |
+
reward_weights:
|
| 797 |
+
value: null
|
| 798 |
+
rollout_importance_sampling_mode:
|
| 799 |
+
value: null
|
| 800 |
+
rollout_importance_sampling_threshold:
|
| 801 |
+
value: 2
|
| 802 |
+
router_aux_loss_coef:
|
| 803 |
+
value: 0
|
| 804 |
+
run_name:
|
| 805 |
+
value: qwen3asr_dapo_reward56_4x4x12_12gen_4GPU
|
| 806 |
+
safe_serialization:
|
| 807 |
+
value: true
|
| 808 |
+
sapo_temperature_neg:
|
| 809 |
+
value: 1.05
|
| 810 |
+
sapo_temperature_pos:
|
| 811 |
+
value: 1
|
| 812 |
+
save_on_each_node:
|
| 813 |
+
value: false
|
| 814 |
+
save_only_model:
|
| 815 |
+
value: false
|
| 816 |
+
save_safetensors:
|
| 817 |
+
value: true
|
| 818 |
+
save_steps:
|
| 819 |
+
value: 20
|
| 820 |
+
save_strategy:
|
| 821 |
+
value: steps
|
| 822 |
+
save_total_limit:
|
| 823 |
+
value: null
|
| 824 |
+
scale_rewards:
|
| 825 |
+
value: group
|
| 826 |
+
seed:
|
| 827 |
+
value: 42
|
| 828 |
+
sep_token_id:
|
| 829 |
+
value: null
|
| 830 |
+
shuffle_dataset:
|
| 831 |
+
value: true
|
| 832 |
+
skip_memory_metrics:
|
| 833 |
+
value: true
|
| 834 |
+
sleep_level:
|
| 835 |
+
value: 0
|
| 836 |
+
soft_cache_length:
|
| 837 |
+
value: null
|
| 838 |
+
soft_max_length:
|
| 839 |
+
value: null
|
| 840 |
+
steps_per_generation:
|
| 841 |
+
value: 3
|
| 842 |
+
stop_words:
|
| 843 |
+
value: []
|
| 844 |
+
structured_outputs_regex:
|
| 845 |
+
value: null
|
| 846 |
+
support_languages:
|
| 847 |
+
value:
|
| 848 |
+
- Chinese
|
| 849 |
+
- English
|
| 850 |
+
- Cantonese
|
| 851 |
+
- Arabic
|
| 852 |
+
- German
|
| 853 |
+
- French
|
| 854 |
+
- Spanish
|
| 855 |
+
- Portuguese
|
| 856 |
+
- Indonesian
|
| 857 |
+
- Italian
|
| 858 |
+
- Korean
|
| 859 |
+
- Russian
|
| 860 |
+
- Thai
|
| 861 |
+
- Vietnamese
|
| 862 |
+
- Japanese
|
| 863 |
+
- Turkish
|
| 864 |
+
- Hindi
|
| 865 |
+
- Malay
|
| 866 |
+
- Dutch
|
| 867 |
+
- Swedish
|
| 868 |
+
- Danish
|
| 869 |
+
- Finnish
|
| 870 |
+
- Polish
|
| 871 |
+
- Czech
|
| 872 |
+
- Filipino
|
| 873 |
+
- Persian
|
| 874 |
+
- Greek
|
| 875 |
+
- Romanian
|
| 876 |
+
- Hungarian
|
| 877 |
+
- Macedonian
|
| 878 |
+
suppress_tokens:
|
| 879 |
+
value: null
|
| 880 |
+
sync_ref_model:
|
| 881 |
+
value: false
|
| 882 |
+
task_specific_params:
|
| 883 |
+
value: null
|
| 884 |
+
tau_neg:
|
| 885 |
+
value: 1.05
|
| 886 |
+
tau_pos:
|
| 887 |
+
value: 1
|
| 888 |
+
temperature:
|
| 889 |
+
value: 0.5
|
| 890 |
+
tf_legacy_loss:
|
| 891 |
+
value: false
|
| 892 |
+
tf32:
|
| 893 |
+
value: null
|
| 894 |
+
thinker_config:
|
| 895 |
+
value:
|
| 896 |
+
_name_or_path: ""
|
| 897 |
+
add_cross_attention: false
|
| 898 |
+
architectures:
|
| 899 |
+
- Qwen3ASRForConditionalGeneration
|
| 900 |
+
audio_config:
|
| 901 |
+
_name_or_path: ""
|
| 902 |
+
activation_dropout: 0
|
| 903 |
+
activation_function: gelu
|
| 904 |
+
add_cross_attention: false
|
| 905 |
+
architectures: null
|
| 906 |
+
attention_dropout: 0
|
| 907 |
+
bad_words_ids: null
|
| 908 |
+
begin_suppress_tokens: null
|
| 909 |
+
bos_token_id: null
|
| 910 |
+
chunk_size_feed_forward: 0
|
| 911 |
+
conv_chunksize: 500
|
| 912 |
+
cross_attention_hidden_size: null
|
| 913 |
+
d_model: 1024
|
| 914 |
+
decoder_start_token_id: null
|
| 915 |
+
diversity_penalty: 0
|
| 916 |
+
do_sample: false
|
| 917 |
+
downsample_hidden_size: 480
|
| 918 |
+
dropout: 0
|
| 919 |
+
dtype: null
|
| 920 |
+
early_stopping: false
|
| 921 |
+
encoder_attention_heads: 16
|
| 922 |
+
encoder_ffn_dim: 4096
|
| 923 |
+
encoder_layers: 24
|
| 924 |
+
encoder_no_repeat_ngram_size: 0
|
| 925 |
+
eos_token_id: null
|
| 926 |
+
exponential_decay_length_penalty: null
|
| 927 |
+
finetuning_task: null
|
| 928 |
+
forced_bos_token_id: null
|
| 929 |
+
forced_eos_token_id: null
|
| 930 |
+
id2label:
|
| 931 |
+
"0": LABEL_0
|
| 932 |
+
"1": LABEL_1
|
| 933 |
+
initializer_range: 0.02
|
| 934 |
+
is_decoder: false
|
| 935 |
+
is_encoder_decoder: false
|
| 936 |
+
label2id:
|
| 937 |
+
LABEL_0: 0
|
| 938 |
+
LABEL_1: 1
|
| 939 |
+
length_penalty: 1
|
| 940 |
+
max_length: 20
|
| 941 |
+
max_source_positions: 1500
|
| 942 |
+
min_length: 0
|
| 943 |
+
model_type: qwen3_asr_audio_encoder
|
| 944 |
+
n_window: 50
|
| 945 |
+
n_window_infer: 800
|
| 946 |
+
no_repeat_ngram_size: 0
|
| 947 |
+
num_beam_groups: 1
|
| 948 |
+
num_beams: 1
|
| 949 |
+
num_hidden_layers: 24
|
| 950 |
+
num_mel_bins: 128
|
| 951 |
+
num_return_sequences: 1
|
| 952 |
+
output_attentions: false
|
| 953 |
+
output_dim: 2048
|
| 954 |
+
output_hidden_states: false
|
| 955 |
+
output_scores: false
|
| 956 |
+
pad_token_id: null
|
| 957 |
+
prefix: null
|
| 958 |
+
problem_type: null
|
| 959 |
+
remove_invalid_values: false
|
| 960 |
+
repetition_penalty: 1
|
| 961 |
+
return_dict: true
|
| 962 |
+
return_dict_in_generate: false
|
| 963 |
+
scale_embedding: false
|
| 964 |
+
sep_token_id: null
|
| 965 |
+
suppress_tokens: null
|
| 966 |
+
task_specific_params: null
|
| 967 |
+
temperature: 1
|
| 968 |
+
tf_legacy_loss: false
|
| 969 |
+
tie_encoder_decoder: false
|
| 970 |
+
tie_word_embeddings: true
|
| 971 |
+
tokenizer_class: null
|
| 972 |
+
top_k: 50
|
| 973 |
+
top_p: 1
|
| 974 |
+
torchscript: false
|
| 975 |
+
typical_p: 1
|
| 976 |
+
use_bfloat16: false
|
| 977 |
+
audio_end_token_id: 151670
|
| 978 |
+
audio_start_token_id: 151669
|
| 979 |
+
audio_token_id: 151676
|
| 980 |
+
bad_words_ids: null
|
| 981 |
+
begin_suppress_tokens: null
|
| 982 |
+
bos_token_id: null
|
| 983 |
+
chunk_size_feed_forward: 0
|
| 984 |
+
cross_attention_hidden_size: null
|
| 985 |
+
decoder_start_token_id: null
|
| 986 |
+
diversity_penalty: 0
|
| 987 |
+
do_sample: false
|
| 988 |
+
dtype: bfloat16
|
| 989 |
+
early_stopping: false
|
| 990 |
+
encoder_no_repeat_ngram_size: 0
|
| 991 |
+
eos_token_id: null
|
| 992 |
+
exponential_decay_length_penalty: null
|
| 993 |
+
finetuning_task: null
|
| 994 |
+
forced_bos_token_id: null
|
| 995 |
+
forced_eos_token_id: null
|
| 996 |
+
id2label:
|
| 997 |
+
"0": LABEL_0
|
| 998 |
+
"1": LABEL_1
|
| 999 |
+
initializer_range: 0.02
|
| 1000 |
+
is_decoder: false
|
| 1001 |
+
is_encoder_decoder: false
|
| 1002 |
+
label2id:
|
| 1003 |
+
LABEL_0: 0
|
| 1004 |
+
LABEL_1: 1
|
| 1005 |
+
length_penalty: 1
|
| 1006 |
+
max_length: 20
|
| 1007 |
+
min_length: 0
|
| 1008 |
+
model_type: qwen3_asr_thinker
|
| 1009 |
+
no_repeat_ngram_size: 0
|
| 1010 |
+
num_beam_groups: 1
|
| 1011 |
+
num_beams: 1
|
| 1012 |
+
num_return_sequences: 1
|
| 1013 |
+
output_attentions: false
|
| 1014 |
+
output_hidden_states: false
|
| 1015 |
+
output_scores: false
|
| 1016 |
+
pad_token_id: null
|
| 1017 |
+
prefix: null
|
| 1018 |
+
problem_type: null
|
| 1019 |
+
remove_invalid_values: false
|
| 1020 |
+
repetition_penalty: 1
|
| 1021 |
+
return_dict: true
|
| 1022 |
+
return_dict_in_generate: false
|
| 1023 |
+
sep_token_id: null
|
| 1024 |
+
suppress_tokens: null
|
| 1025 |
+
task_specific_params: null
|
| 1026 |
+
temperature: 1
|
| 1027 |
+
text_config:
|
| 1028 |
+
_name_or_path: ""
|
| 1029 |
+
add_cross_attention: false
|
| 1030 |
+
architectures: null
|
| 1031 |
+
attention_bias: false
|
| 1032 |
+
attention_dropout: 0
|
| 1033 |
+
bad_words_ids: null
|
| 1034 |
+
begin_suppress_tokens: null
|
| 1035 |
+
bos_token_id: null
|
| 1036 |
+
chunk_size_feed_forward: 0
|
| 1037 |
+
cross_attention_hidden_size: null
|
| 1038 |
+
decoder_start_token_id: null
|
| 1039 |
+
diversity_penalty: 0
|
| 1040 |
+
do_sample: false
|
| 1041 |
+
dtype: null
|
| 1042 |
+
early_stopping: false
|
| 1043 |
+
encoder_no_repeat_ngram_size: 0
|
| 1044 |
+
eos_token_id: null
|
| 1045 |
+
exponential_decay_length_penalty: null
|
| 1046 |
+
finetuning_task: null
|
| 1047 |
+
forced_bos_token_id: null
|
| 1048 |
+
forced_eos_token_id: null
|
| 1049 |
+
head_dim: 128
|
| 1050 |
+
hidden_act: silu
|
| 1051 |
+
hidden_size: 2048
|
| 1052 |
+
id2label:
|
| 1053 |
+
"0": LABEL_0
|
| 1054 |
+
"1": LABEL_1
|
| 1055 |
+
initializer_range: 0.02
|
| 1056 |
+
intermediate_size: 6144
|
| 1057 |
+
is_decoder: false
|
| 1058 |
+
is_encoder_decoder: false
|
| 1059 |
+
label2id:
|
| 1060 |
+
LABEL_0: 0
|
| 1061 |
+
LABEL_1: 1
|
| 1062 |
+
length_penalty: 1
|
| 1063 |
+
max_length: 20
|
| 1064 |
+
max_position_embeddings: 65536
|
| 1065 |
+
min_length: 0
|
| 1066 |
+
model_type: qwen3_asr_text
|
| 1067 |
+
no_repeat_ngram_size: 0
|
| 1068 |
+
num_attention_heads: 16
|
| 1069 |
+
num_beam_groups: 1
|
| 1070 |
+
num_beams: 1
|
| 1071 |
+
num_hidden_layers: 28
|
| 1072 |
+
num_key_value_heads: 8
|
| 1073 |
+
num_return_sequences: 1
|
| 1074 |
+
output_attentions: false
|
| 1075 |
+
output_hidden_states: false
|
| 1076 |
+
output_scores: false
|
| 1077 |
+
pad_token_id: 151643
|
| 1078 |
+
prefix: null
|
| 1079 |
+
problem_type: null
|
| 1080 |
+
remove_invalid_values: false
|
| 1081 |
+
repetition_penalty: 1
|
| 1082 |
+
return_dict: true
|
| 1083 |
+
return_dict_in_generate: false
|
| 1084 |
+
rms_norm_eps: 1e-06
|
| 1085 |
+
rope_scaling:
|
| 1086 |
+
interleaved: true
|
| 1087 |
+
mrope_interleaved: true
|
| 1088 |
+
mrope_section:
|
| 1089 |
+
- 24
|
| 1090 |
+
- 20
|
| 1091 |
+
- 20
|
| 1092 |
+
rope_type: default
|
| 1093 |
+
type: default
|
| 1094 |
+
rope_theta: 1000000
|
| 1095 |
+
sep_token_id: null
|
| 1096 |
+
suppress_tokens: null
|
| 1097 |
+
task_specific_params: null
|
| 1098 |
+
temperature: 1
|
| 1099 |
+
tf_legacy_loss: false
|
| 1100 |
+
tie_encoder_decoder: false
|
| 1101 |
+
tie_word_embeddings: true
|
| 1102 |
+
tokenizer_class: null
|
| 1103 |
+
top_k: 50
|
| 1104 |
+
top_p: 1
|
| 1105 |
+
torchscript: false
|
| 1106 |
+
typical_p: 1
|
| 1107 |
+
use_bfloat16: false
|
| 1108 |
+
use_cache: false
|
| 1109 |
+
vocab_size: 151936
|
| 1110 |
+
tf_legacy_loss: false
|
| 1111 |
+
tie_encoder_decoder: false
|
| 1112 |
+
tie_word_embeddings: true
|
| 1113 |
+
tokenizer_class: null
|
| 1114 |
+
top_k: 50
|
| 1115 |
+
top_p: 1
|
| 1116 |
+
torchscript: false
|
| 1117 |
+
typical_p: 1
|
| 1118 |
+
use_bfloat16: false
|
| 1119 |
+
user_token_id: 872
|
| 1120 |
+
tie_encoder_decoder:
|
| 1121 |
+
value: false
|
| 1122 |
+
tie_word_embeddings:
|
| 1123 |
+
value: true
|
| 1124 |
+
tokenizer_class:
|
| 1125 |
+
value: null
|
| 1126 |
+
top_entropy_quantile:
|
| 1127 |
+
value: 1
|
| 1128 |
+
top_k:
|
| 1129 |
+
value: 50
|
| 1130 |
+
top_p:
|
| 1131 |
+
value: 0.95
|
| 1132 |
+
torch_compile:
|
| 1133 |
+
value: false
|
| 1134 |
+
torch_compile_backend:
|
| 1135 |
+
value: null
|
| 1136 |
+
torch_compile_mode:
|
| 1137 |
+
value: null
|
| 1138 |
+
torch_empty_cache_steps:
|
| 1139 |
+
value: null
|
| 1140 |
+
torchdynamo:
|
| 1141 |
+
value: null
|
| 1142 |
+
torchscript:
|
| 1143 |
+
value: false
|
| 1144 |
+
tpu_metrics_debug:
|
| 1145 |
+
value: false
|
| 1146 |
+
tpu_num_cores:
|
| 1147 |
+
value: null
|
| 1148 |
+
trackio_space_id:
|
| 1149 |
+
value: trackio
|
| 1150 |
+
train_dataloader_shuffle:
|
| 1151 |
+
value: true
|
| 1152 |
+
transformers_version:
|
| 1153 |
+
value: 4.57.6
|
| 1154 |
+
tuner_backend:
|
| 1155 |
+
value: peft
|
| 1156 |
+
tuner_type:
|
| 1157 |
+
value: lora
|
| 1158 |
+
typical_p:
|
| 1159 |
+
value: 1
|
| 1160 |
+
use_bfloat16:
|
| 1161 |
+
value: false
|
| 1162 |
+
use_bias_correction_kl:
|
| 1163 |
+
value: false
|
| 1164 |
+
use_cpu:
|
| 1165 |
+
value: false
|
| 1166 |
+
use_flash_ckpt:
|
| 1167 |
+
value: false
|
| 1168 |
+
use_galore:
|
| 1169 |
+
value: false
|
| 1170 |
+
use_legacy_prediction_loop:
|
| 1171 |
+
value: false
|
| 1172 |
+
use_liger_kernel:
|
| 1173 |
+
value: false
|
| 1174 |
+
use_logits_to_keep:
|
| 1175 |
+
value: null
|
| 1176 |
+
use_mps_device:
|
| 1177 |
+
value: false
|
| 1178 |
+
use_transformers_paged:
|
| 1179 |
+
value: false
|
| 1180 |
+
use_vllm:
|
| 1181 |
+
value: false
|
| 1182 |
+
vit_gradient_checkpointing:
|
| 1183 |
+
value: true
|
| 1184 |
+
vit_lr:
|
| 1185 |
+
value: null
|
| 1186 |
+
vllm_data_parallel_size:
|
| 1187 |
+
value: 1
|
| 1188 |
+
vllm_disable_cascade_attn:
|
| 1189 |
+
value: false
|
| 1190 |
+
vllm_disable_custom_all_reduce:
|
| 1191 |
+
value: true
|
| 1192 |
+
vllm_enable_expert_parallel:
|
| 1193 |
+
value: false
|
| 1194 |
+
vllm_enable_lora:
|
| 1195 |
+
value: false
|
| 1196 |
+
vllm_enable_prefix_caching:
|
| 1197 |
+
value: true
|
| 1198 |
+
vllm_enable_sleep_mode:
|
| 1199 |
+
value: false
|
| 1200 |
+
vllm_enforce_eager:
|
| 1201 |
+
value: false
|
| 1202 |
+
vllm_gpu_memory_utilization:
|
| 1203 |
+
value: 0.9
|
| 1204 |
+
vllm_group_port:
|
| 1205 |
+
value: 51216
|
| 1206 |
+
vllm_importance_sampling_cap:
|
| 1207 |
+
value: 3
|
| 1208 |
+
vllm_importance_sampling_correction:
|
| 1209 |
+
value: true
|
| 1210 |
+
vllm_importance_sampling_mode:
|
| 1211 |
+
value: sequence_mask
|
| 1212 |
+
vllm_limit_mm_per_prompt:
|
| 1213 |
+
value: null
|
| 1214 |
+
vllm_max_lora_rank:
|
| 1215 |
+
value: 16
|
| 1216 |
+
vllm_max_model_len:
|
| 1217 |
+
value: null
|
| 1218 |
+
vllm_max_model_length:
|
| 1219 |
+
value: null
|
| 1220 |
+
vllm_max_num_seqs:
|
| 1221 |
+
value: null
|
| 1222 |
+
vllm_mm_processor_cache_gb:
|
| 1223 |
+
value: null
|
| 1224 |
+
vllm_mode:
|
| 1225 |
+
value: null
|
| 1226 |
+
vllm_model_impl:
|
| 1227 |
+
value: vllm
|
| 1228 |
+
vllm_pipeline_parallel_size:
|
| 1229 |
+
value: 1
|
| 1230 |
+
vllm_quantization:
|
| 1231 |
+
value: null
|
| 1232 |
+
vllm_reasoning_parser:
|
| 1233 |
+
value: null
|
| 1234 |
+
vllm_server_base_url:
|
| 1235 |
+
value: null
|
| 1236 |
+
vllm_server_group_port:
|
| 1237 |
+
value: null
|
| 1238 |
+
vllm_server_host:
|
| 1239 |
+
value: null
|
| 1240 |
+
vllm_server_pass_dataset:
|
| 1241 |
+
value: false
|
| 1242 |
+
vllm_server_port:
|
| 1243 |
+
value:
|
| 1244 |
+
- 8000
|
| 1245 |
+
vllm_server_timeout:
|
| 1246 |
+
value: 240
|
| 1247 |
+
vllm_speculative_config:
|
| 1248 |
+
value: null
|
| 1249 |
+
vllm_structured_outputs_regex:
|
| 1250 |
+
value: null
|
| 1251 |
+
vllm_tensor_parallel_size:
|
| 1252 |
+
value: 1
|
| 1253 |
+
vllm_use_async_engine:
|
| 1254 |
+
value: null
|
| 1255 |
+
wandb_log_unique_prompts:
|
| 1256 |
+
value: null
|
| 1257 |
+
warmup_ratio:
|
| 1258 |
+
value: 0.03
|
| 1259 |
+
warmup_steps:
|
| 1260 |
+
value: 0
|
| 1261 |
+
weight_decay:
|
| 1262 |
+
value: 0.1
|
wandb/run-20260418_172847-c2a5hfz3/files/media/table/completions_291_2ce0194cf48cadccd2a9.table.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"columns": ["step", "prompt", "completion", "ASRWerSubLenCmpHalluDirtyV56", "advantages", "solution"], "data": [["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Captain markham, it's about about my wife. Polly answered, casting down her eyes and returning a very red. The other day, the whistle.<|im_end|>", 0.1822807341814041, -0.8288241028785706, "Captain marker, it's about about my wife. Crawley answered, casting down his eyes and turning very red. The other gave a whistle."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Captain marten, it's about about my wife. Crawley answered, casting down his eyes and returning very red. The other gave a whistle.<|im_end|>", 0.7842410206794739, 1.4543499946594238, "Captain marker, it's about about my wife. Crawley answered, casting down his eyes and turning very red. The other gave a whistle."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Captain knocker, it's about about my wife. Crawley answered, casting down his eyes and returning a very red the other day, the whistle.<|im_end|>", 0.31845957040786743, -0.31231164932250977, "Captain marker, it's about about my wife. Crawley answered, casting down his eyes and turning very red. The other gave a whistle."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Captain Markham, it's about about my wife, Crawley answered, casting down his eyes and returning a very red. The other day, the whistle.<|im_end|>", 0.3182216286659241, -0.31321415305137634, "Captain marker, it's about about my wife. Crawley answered, casting down his eyes and turning very red. 
The other gave a whistle."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At evening upon the world, while others hint that knowledge of these might undo our civilization. There watched him ceaselessly from the under pits those eyes whose duty it is from further within and deeper.<|im_end|>", 0.8666909337043762, 0.20433472096920013, "At evening upon the world, while others hint that knowledge of these might undo our civilization, there watched him ceaselessly from the under pits, those eyes whose duty it is from further within and deeper."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At evening upon the world, while others hint that knowledge of these might undo our civilization, there watched him ceaselessly from the underpits those eyes whose duty it is, from further within and deeper.<|im_end|>", 0.8165187239646912, -0.6340823769569397, "At evening upon the world, while others hint that knowledge of these might undo our civilization, there watched him ceaselessly from the under pits, those eyes whose duty it is from further within and deeper."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At evening upon the world, while others hint that knowledge of these might undo our civilization, there watched him ceaselessly from the under pits those eyes whose duty it is from further within and deeper.<|im_end|>", 0.9336058497428894, 1.3225356340408325, "At evening upon the world, while others hint that knowledge of these might undo our civilization, there watched him ceaselessly from the under pits, those eyes whose duty it is from further within and deeper."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At evening upon the world, while others hint that 
knowledge of these might undo our civilization. There watched him ceaselessly from the under pits those eyes whose duty it is, from further within and deeper.<|im_end|>", 0.8010374307632446, -0.8927869200706482, "At evening upon the world, while others hint that knowledge of these might undo our civilization, there watched him ceaselessly from the under pits, those eyes whose duty it is from further within and deeper."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Milly steered her magnificent way like some great liner cleaving among the canoes of howling savages. Our goddess of grub was built on lines so majestic that they could be followed only with awe.<|im_end|>", 1.0, 0.0, "Milly steered her magnificent way like some great liner cleaving among the canoes of howling savages. Our goddess of grub was built on lines so majestic that they could be followed only with awe."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Milly steered her magnificent way like some great liner cleaving among the canoes of howling savages. Our goddess of grub was built on lines so majestic that they could be followed only with awe.<|im_end|>", 1.0, 0.0, "Milly steered her magnificent way like some great liner cleaving among the canoes of howling savages. Our goddess of grub was built on lines so majestic that they could be followed only with awe."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Milly steered her magnificent way like some great liner cleaving among the canoes of howling savages. Our goddess of grub was built on lines so majestic that they could be followed only with awe.<|im_end|>", 1.0, 0.0, "Milly steered her magnificent way like some great liner cleaving among the canoes of howling savages. 
Our goddess of grub was built on lines so majestic that they could be followed only with awe."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Milly steered her magnificent way like some great liner cleaving among the canoes of howling savages. Our goddess of grub was built on lines so majestic that they could be followed only with awe.<|im_end|>", 1.0, 0.0, "Milly steered her magnificent way like some great liner cleaving among the canoes of howling savages. Our goddess of grub was built on lines so majestic that they could be followed only with awe."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And made properly lavish time out of working time. It is not improbable that glossy buttons are a valid feature in the garb of a humdrum and harassed hospital porter. Many intellect.<|im_end|>", 0.11065644025802612, 0.8317853212356567, "And may properly lavish time and trouble thereupon. It is not arguable that glossy buttons are a valid feature of the garb of a humdrum and harassed hospital, orderly many a time."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And may properly lavish time and sport in a pantomime. It is not improbable that glossy buttons are a valid feature of the garb for humdrum and grassy hospitals, or more many intellect.<|im_end|>", -0.05923449248075485, -1.18646240234375, "And may properly lavish time and trouble thereupon. It is not arguable that glossy buttons are a valid feature of the garb of a humdrum and harassed hospital, orderly many a time."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And make properly lavish time out of working time. 
It is not improbable that glossy buttons are a valid feature in the garb of a humdrum and harassed hospital porter. Many intellect.<|im_end|>", 0.10980796068906784, 0.82170569896698, "And may properly lavish time and trouble thereupon. It is not arguable that glossy buttons are a valid feature of the garb of a humdrum and harassed hospital, orderly many a time."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And may properly lavish time after working upon it is not remarkable that glossy buttons are a valid feature of the garb for humdrum and grassy hospitals or more many intellect.<|im_end|>", 0.0013256088132038713, -0.46702858805656433, "And may properly lavish time and trouble thereupon. It is not arguable that glossy buttons are a valid feature of the garb of a humdrum and harassed hospital, orderly many a time."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And Shahrazad perceived the dawn of day and ceased saying her permitted say when it was the six hundred and seventy seventh night, she pursued it hath reached me o auspicious king that when the kafirs fell upon harib.<|im_end|>", 0.7613571882247925, 1.3583694696426392, "And shahrazad perceived the dawn of day and ceased saying her permitted say. When it was the six hundred and seventy seventh night, she pursued it. Hath reached me o auspicious king, that when the kafirs fell upon gharib."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And Shahrazad perceived the dawn of day and ceased saying her permitted say, when it was the six hundred and seventy seventh night. 
She pursued, it hath reached me, O auspicious king, that when the kaffirs fell upon Harib.<|im_end|>", 0.5681424736976624, -1.0484904050827026, "And shahrazad perceived the dawn of day and ceased saying her permitted say. When it was the six hundred and seventy seventh night, she pursued it. Hath reached me o auspicious king, that when the kafirs fell upon gharib."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And Shahrazad perceived the dawn of day and ceased saying her permitted say when it was the six hundred and seventy seventh night she pursued, it hath reached me o auspicious king that when the kafirs fell upon Harib.<|im_end|>", 0.6401126384735107, -0.1519639790058136, "And shahrazad perceived the dawn of day and ceased saying her permitted say. When it was the six hundred and seventy seventh night, she pursued it. Hath reached me o auspicious king, that when the kafirs fell upon gharib."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And Shahrazad perceived the dawn of day and ceased saying her permitted say, when it was the six hundred and seventy seventh night she pursued, it hath reached me o auspicious king that when the kafirs fell upon harib.<|im_end|>", 0.6396347880363464, -0.15791653096675873, "And shahrazad perceived the dawn of day and ceased saying her permitted say. When it was the six hundred and seventy seventh night, she pursued it. 
Hath reached me o auspicious king, that when the kafirs fell upon gharib."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>beasy would make reply but was from a certain person whom perhaps we need not name then the whiskey bottle would move forward like a pawn in chess and the next suaded words would be<|im_end|>", 0.8032140731811523, 0.47693824768066406, "deasey would make reply but twas from a certain person whom perhaps we need not name then the whiskey bottle would move forward like a pawn in chess and the next soothing words would be"], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>beasley would make reply, but was from a certain person whom perhaps we need not name then the whiskey bottle would move forward like a pawn in chess and the next soothing words would be<|im_end|>", 0.8078052401542664, 0.5542405247688293, "deasey would make reply but twas from a certain person whom perhaps we need not name then the whiskey bottle would move forward like a pawn in chess and the next soothing words would be"], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>these he would make reply, but was from a certain person whom perhaps we need not name then the whiskey bottle would move forward like a pawn in chess and the next suaded words would be<|im_end|>", 0.6860186457633972, -1.4963009357452393, "deasey would make reply but twas from a certain person whom perhaps we need not name then the whiskey bottle would move forward like a pawn in chess and the next soothing words would be"], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>hezekiah would make reply but was from a certain person whom perhaps we need not name then the whiskey bottle would move forward like a palm in 
chess and the next soothing words would be<|im_end|>", 0.8025121688842773, 0.4651201665401459, "deasey would make reply but twas from a certain person whom perhaps we need not name then the whiskey bottle would move forward like a pawn in chess and the next soothing words would be"], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He did in fact begin it when setting out on the aforementioned second trip to Europe, calling it.<|im_end|>", 0.7412750124931335, -0.7827419638633728, "He did, in fact, begin it when setting out on the aforementioned second trip to europe, calling it."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He did, in fact, begin it when setting out on the aforementioned second trip to Europe calling it.<|im_end|>", 0.8706542253494263, 0.26100391149520874, "He did, in fact, begin it when setting out on the aforementioned second trip to europe, calling it."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He did, in fact, begin it when setting out on the aforementioned second trip to Europe, calling it.<|im_end|>", 1.0, 1.3044800758361816, "He did, in fact, begin it when setting out on the aforementioned second trip to europe, calling it."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He did in fact begin it when setting out on the aforementioned second trip to Europe, calling it.<|im_end|>", 0.7412750124931335, -0.7827419638633728, "He did, in fact, begin it when setting out on the aforementioned second trip to europe, calling it."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Bayard knew that his master was upon him, and he started off upon a rapid pace. 
And in a few moments, he had galloped. Malagigi pretended to be in great alarm. O noble king and master, he cried, my poor companion has run away with. He will fall and break his neck.<|im_end|>", 0.45684748888015747, 1.159354329109192, "Bayard knew that his master was upon him, and he started off upon a rapid pace, and in a few moments was a good way off. Malagigi pretended to be in great alarm o, noble king and master. He cried, my poor companion is run away with he will fall and break his neck."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Fayard knew that his master was upon him, and he started off upon a rapid pace. And in a few moments, he had galloped on. Malagigi pretended to be in great alarm. O noble king and master, he cried, my poor companion has run away with. He will fall and break his neck.<|im_end|>", 0.3951204717159271, -0.9790310263633728, "Bayard knew that his master was upon him, and he started off upon a rapid pace, and in a few moments was a good way off. Malagigi pretended to be in great alarm o, noble king and master. He cried, my poor companion is run away with he will fall and break his neck."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Fayard knew that his master was upon him, and he started off upon a rapid pace. And in a few moments, he had galloped away. Malagigi pretended to be in great alarm. O noble king and master, he cried, my poor companion has run away with me. He will fall and break his neck.<|im_end|>", 0.4041914939880371, -0.6647871136665344, "Bayard knew that his master was upon him, and he started off upon a rapid pace, and in a few moments was a good way off. Malagigi pretended to be in great alarm o, noble king and master. 
He cried, my poor companion is run away with he will fall and break his neck."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Vaillard knew that his master was upon him, and he started off upon a rapid pace. And in a few moments of he did run off malagigi pretended to be in great alarm. O noble king and master, he cried, my poor companion has run away with. He will fall and break his neck.<|im_end|>", 0.43736597895622253, 0.4844638407230377, "Bayard knew that his master was upon him, and he started off upon a rapid pace, and in a few moments was a good way off. Malagigi pretended to be in great alarm o, noble king and master. He cried, my poor companion is run away with he will fall and break his neck."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>She laid a firm, delicate hand on her gold green jerkin. Ellidore. This was pleasant, but we got no nearer. We can't sit here and learn the language. Terry protested.<|im_end|>", 0.9188264608383179, 0.447922945022583, "She laid a firm, delicate hand on her gold green jerkin. Ellador, this was pleasant, but we got no nearer. We can't sit here and learn the language. Terry protested."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>She laid a firm, delicate hand on her gold green jerkin. Ellador, this was pleasant. But we got no nearer. We can't sit here and learn the language. Terry protested.<|im_end|>", 0.9217362999916077, 0.5236092805862427, "She laid a firm, delicate hand on her gold green jerkin. Ellador, this was pleasant, but we got no nearer. We can't sit here and learn the language. 
Terry protested."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>She laid a firm, delicate hand on her gold green jerkin ellador. This was pleasant, but we got no nearer. We can't sit here and learn the language. Terry protested.<|im_end|>", 0.8441234230995178, -1.4951399564743042, "She laid a firm, delicate hand on her gold green jerkin. Ellador, this was pleasant, but we got no nearer. We can't sit here and learn the language. Terry protested."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>She laid a firm, delicate hand on her gold green jerkin. Ellador, this was pleasant. But we got no nearer. We can't sit here and learn the language. Terry protested.<|im_end|>", 0.9217362999916077, 0.5236092805862427, "She laid a firm, delicate hand on her gold green jerkin. Ellador, this was pleasant, but we got no nearer. We can't sit here and learn the language. 
Terry protested."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>he cried out savage and fought and struggled two minutes however he did little against his four adversaries and worn out with his struggle flat suddenly from the dusty floor with emotion in spirit lost lost he muttered all lost<|im_end|>", 0.09937235713005066, 0.43719542026519775, "he cried out savagely and fought with the strength of two men however he could do little against his four adversaries and worn out with the struggle collapsed suddenly on to the dusty floor with a motion of despair lost lost he muttered all lost"], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>he cried out sadly and fought and strangled two men however he did little against four adversaries the worn out with his struggle flat suddenly upon the dusty floor with emotion in his spirit lost lost he muttered all lost<|im_end|>", 0.03799943998456001, -0.10167413204908371, "he cried out savagely and fought with the strength of two men however he could do little against his four adversaries and worn out with the struggle collapsed suddenly on to the dusty floor with a motion of despair lost lost he muttered all lost"], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>he cried out savage and fought and strangled two men however he did little against four adversaries and worn out with his struggle flat suddenly on the dusty floor with emotion in his spirit lost lost he muttered all lost<|im_end|>", 0.16370610892772675, 1.0020618438720703, "he cried out savagely and fought with the strength of two men however he could do little against his four adversaries and worn out with the struggle collapsed suddenly on to the dusty floor with a motion of despair lost lost he muttered all lost"], ["580", 
"<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>he cried out savagely and fought and struggled two minutes however with little against four adversaries and worn out of his breath, platt suddenly among the dusty floor with emotion in his spirit lost lost he muttered all lost<|im_end|>", -0.1027606725692749, -1.337583065032959, "he cried out savagely and fought with the strength of two men however he could do little against his four adversaries and worn out with the struggle collapsed suddenly on to the dusty floor with a motion of despair lost lost he muttered all lost"], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And thus he accomplished this by the bye during the siege of the city, for he had his enemies in great contempt already. Nine when he had thus married Mariamne.<|im_end|>", 0.6356512308120728, -0.49875012040138245, "And thus he accomplished this by the by, during the siege of the city. For he had his enemies in great contempt already nine when he had thus married mariamne, he."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And thus he accomplished this by the bye during the siege of the city, for he had his enemies in great contempt already. Nine when he had thus married Mariamne.<|im_end|>", 0.6356512308120728, -0.49875012040138245, "And thus he accomplished this by the by, during the siege of the city. 
For he had his enemies in great contempt already nine when he had thus married mariamne, he."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And thus he accomplished this by the bye during the siege of the city, for he had his enemies in great contempt already nine when he had thus married mariamne.<|im_end|>", 0.715508222579956, 1.4962533712387085, "And thus he accomplished this by the by, during the siege of the city. For he had his enemies in great contempt already nine when he had thus married mariamne, he."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And thus he accomplished this by the bye during the siege of the city, for he had his enemies in great contempt already. Nine when he had thus married Mariamne.<|im_end|>", 0.6356512308120728, -0.49875012040138245, "And thus he accomplished this by the by, during the siege of the city. For he had his enemies in great contempt already nine when he had thus married mariamne, he."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Putting both hands on her shoulders and looking into the brown eyes, should you be willing to go abroad with your mother and phronsie, mister king and jasper? Oh Polly gasped, but you.<|im_end|>", 0.9294845461845398, 0.7829669117927551, "Putting both hands on her shoulders and looking into the brown eyes, should you be willing to go abroad with your mother and phronsie, mister king and jasper? Oh, polly gasped, but you."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Putting both hands on her shoulders and looking into the brown eyes, should you be willing to go abroad with your mother and phronsie mister king and jasper? Oh Polly gasped. 
But you.<|im_end|>", 0.7878445386886597, -1.3021132946014404, "Putting both hands on her shoulders and looking into the brown eyes, should you be willing to go abroad with your mother and phronsie, mister king and jasper? Oh, polly gasped, but you."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Putting both hands on her shoulders and looking into the brown eyes, should you be willing to go abroad with your mother and phronsie, mister king and jasper? Oh Polly gasped, but you.<|im_end|>", 0.9294845461845398, 0.7829669117927551, "Putting both hands on her shoulders and looking into the brown eyes, should you be willing to go abroad with your mother and phronsie, mister king and jasper? Oh, polly gasped, but you."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Putting both hands on her shoulders and looking into the brown eyes, should you be willing to go abroad with your mother and phronsie, mister king and jasper? Oh Polly gasped. But you.<|im_end|>", 0.858376145362854, -0.2638187110424042, "Putting both hands on her shoulders and looking into the brown eyes, should you be willing to go abroad with your mother and phronsie, mister king and jasper? Oh, polly gasped, but you."]]}
|
wandb/run-20260418_172847-c2a5hfz3/files/media/table/completions_297_2c3b42b29065c75ff192.table.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"columns": ["step", "prompt", "completion", "ASRWerSubLenCmpHalluDirtyV56", "advantages", "solution"], "data": [["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The underling had insufficient, gave orders to the coachman and being readiness on the stairs took him up to his post. The steed balked and was about to kick the whip, ah, does he indicate?<|im_end|>", -0.5885342359542847, 0.47900471091270447, "You have the window. That is sufficient give orders to the coachman and be in readiness on the stairs to conduct us to it. The steward bowed and was about to quit the room. Ah continued the count."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The underling added sufficient, gave orders to the coachman and being readiness on the stairs took him up the steps. The steed balked and was about to caper, ah, it is a wonder good.<|im_end|>", -0.7021157145500183, 0.06742512434720993, "You have the window. That is sufficient give orders to the coachman and be in readiness on the stairs to conduct us to it. The steward bowed and was about to quit the room. Ah continued the count."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The underling was satisfied, gave orders to the coachman and being readiness on the stairs took him up the steps. The steed balked and was about to caper. Bah! Does he indeed?<|im_end|>", -0.7042824625968933, 0.05957358703017235, "You have the window. That is sufficient give orders to the coachman and be in readiness on the stairs to conduct us to it. The steward bowed and was about to quit the room. 
Ah continued the count."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The underling had insufficient the orders for capture and being readiness on the stairs took a left of straight the steed balked and was about to capitulate, ah, it is my defeat.<|im_end|>", -0.968815267086029, -0.899000883102417, "You have the window. That is sufficient give orders to the coachman and be in readiness on the stairs to conduct us to it. The steward bowed and was about to quit the room. Ah continued the count."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The underling had insufficient. He ordered for patron and being readiness on the stairs to connect his trunk, he steered back, and was about to return, but, as I indicated.<|im_end|>", -1.0357601642608643, -1.1415858268737793, "You have the window. That is sufficient give orders to the coachman and be in readiness on the stairs to conduct us to it. The steward bowed and was about to quit the room. Ah continued the count."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The underling was very sufficient. He ordered his detachment, and being readiness on the stairs took a left of straits. The steed balked and was about to fall off. Bah! There is no end to it.<|im_end|>", -1.0646944046020508, -1.2464333772659302, "You have the window. That is sufficient give orders to the coachman and be in readiness on the stairs to conduct us to it. The steward bowed and was about to quit the room. Ah continued the count."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The underling, and is sufficient. Give orders to the coachman in being readiness on the stairs to conduct us straight. The steer barked and was about to get up. 
Ah, there's a winded goat.<|im_end|>", -0.35244596004486084, 1.3345061540603638, "You have the window. That is sufficient give orders to the coachman and be in readiness on the stairs to conduct us to it. The steward bowed and was about to quit the room. Ah continued the count."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The underling was not sufficient. He ordered the patrol, and being readiness on the stairs, took him up the steps. The steamer backed, and he had about to put in, bah! There is no engine.<|im_end|>", -1.093247413635254, -1.3498995304107666, "You have the window. That is sufficient give orders to the coachman and be in readiness on the stairs to conduct us to it. The steward bowed and was about to quit the room. Ah continued the count."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The underling added sufficient, gave orders to the coachman and being readiness on the stairs took a left of stroke. The steer barked and was about to click away. Ah, there's my underling.<|im_end|>", -0.7040185928344727, 0.06052975729107857, "You have the window. That is sufficient give orders to the coachman and be in readiness on the stairs to conduct us to it. The steward bowed and was about to quit the room. Ah continued the count."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The underling, that is sufficient, give orders to the coachman and be in readiness on the stairs to conduct us straight. The steed balks when he is about to pick up baas, his wounded feet.<|im_end|>", -0.28640249371528625, 1.5738246440887451, "You have the window. That is sufficient give orders to the coachman and be in readiness on the stairs to conduct us to it. The steward bowed and was about to quit the room. 
Ah continued the count."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The underling had insufficient, gave orders to the coachman and being readiness on the stairs took him up the steps. The steed balked and was about to kick her, but his rider kicked.<|im_end|>", -0.7038772106170654, 0.06104207783937454, "You have the window. That is sufficient give orders to the coachman and be in readiness on the stairs to conduct us to it. The steward bowed and was about to quit the room. Ah continued the count."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The underling was satisfied, gave orders for the coachman and being readiness on the stairs to conduct us to it. The steed balked and laid about the cookelard, but his lamentations.<|im_end|>", -0.44447875022888184, 1.0010114908218384, "You have the window. That is sufficient give orders to the coachman and be in readiness on the stairs to conduct us to it. The steward bowed and was about to quit the room. Ah continued the count."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>About three claims to hand tom was familiar with most of these claims, but occasionally would see a new one that excited his curiosity. However, he was more interested in what Andy Foger had to manage andy's machine had not been tried. Tom Warner only dared risk five minutes.<|im_end|>", 0.0947486162185669, 0.5240245461463928, "With three planes behind. Tom was familiar with most of these types, but occasionally he saw a new one that excited his curiosity. However, he was more interested in what andy foger would turn out. 
Andy's machine had not been tried, and tom wondered how he dared risk flying in it."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>But three claims to hands, tom was familiar with most of these claims, but occasionally would see a new one that excited his curiosity. However, he was more interested in what Andy Foger had to invent. Andy's machine had not been tried. Tom Warner only dared risk five minutes.<|im_end|>", 0.09490512311458588, 0.5261728763580322, "With three planes behind. Tom was familiar with most of these types, but occasionally he saw a new one that excited his curiosity. However, he was more interested in what andy foger would turn out. Andy's machine had not been tried, and tom wondered how he dared risk flying in it."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At three claims to hand, Tom was familiar with most of these claims, but occasionally would see a new one that excited his curiosity. However, he was more interested in what Andy Foger had to invent. Andy's machine had not been tried. Tom Warner only dared it once for five minutes.<|im_end|>", -0.04116278141736984, -1.3415790796279907, "With three planes behind. Tom was familiar with most of these types, but occasionally he saw a new one that excited his curiosity. However, he was more interested in what andy foger would turn out. Andy's machine had not been tried, and tom wondered how he dared risk flying in it."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>About three claims to hand, tom was familiar with most of these claims, but occasionally would see a new one that excited his curiosity. However, he was more interested in what Andy Foger had to manage. Andy's machine had not been tried. 
Tom Warner only dared risk flying minutes.<|im_end|>", 0.15220792591571808, 1.3127464056015015, "With three planes behind. Tom was familiar with most of these types, but occasionally he saw a new one that excited his curiosity. However, he was more interested in what andy foger would turn out. Andy's machine had not been tried, and tom wondered how he dared risk flying in it."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>About three claims to hand, tom was familiar with most of these claims, but occasionally would see a new one that excited his curiosity. However, he was more interested in what Andy Foger had to manage. Andy's machinery had not been tried. Tom wondered why the era was applying minutes.<|im_end|>", -0.027287397533655167, -1.1511170864105225, "With three planes behind. Tom was familiar with most of these types, but occasionally he saw a new one that excited his curiosity. However, he was more interested in what andy foger would turn out. Andy's machine had not been tried, and tom wondered how he dared risk flying in it."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>But three claims to hand tom was familiar with most of these claims, but occasionally would see a new one that excited his curiosity. However, he was more interested in what Andy Foger had to invent. Andy's machine had not been tried. Tom Warner only dared risk flying minutes.<|im_end|>", 0.153399258852005, 1.329099416732788, "With three planes behind. Tom was familiar with most of these types, but occasionally he saw a new one that excited his curiosity. However, he was more interested in what andy foger would turn out. 
Andy's machine had not been tried, and tom wondered how he dared risk flying in it."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>But three claims to hand tom was familiar with most of these claims, but occasionally would see a new one that excited his curiosity. However, he was more interested in what Andy Foger had to manage. Andy's machine had not been tried. Tom Warner only dared risk flying minutes.<|im_end|>", 0.1526142656803131, 1.318324089050293, "With three planes behind. Tom was familiar with most of these types, but occasionally he saw a new one that excited his curiosity. However, he was more interested in what andy foger would turn out. Andy's machine had not been tried, and tom wondered how he dared risk flying in it."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>But three claims to hand tom was familiar with most of these claims, but occasionally would see a new one that excited his curiosity. However, he was more interested in what Andy Foger had to invent. Andy's machine had not been tried. Tom Warner would only dare to risk five minutes.<|im_end|>", -0.037495389580726624, -1.2912381887435913, "With three planes behind. Tom was familiar with most of these types, but occasionally he saw a new one that excited his curiosity. However, he was more interested in what andy foger would turn out. Andy's machine had not been tried, and tom wondered how he dared risk flying in it."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>About three claims to hand tom was familiar with most of these claims, but occasionally would see a new one that excited his curiosity. However, he was more interested in what Andy Foger had to manage andy's machine had not been tried. 
Tom marvelled at the daring riskful flying minutes.<|im_end|>", 0.026256464421749115, -0.41614094376564026, "With three planes behind. Tom was familiar with most of these types, but occasionally he saw a new one that excited his curiosity. However, he was more interested in what andy foger would turn out. Andy's machine had not been tried, and tom wondered how he dared risk flying in it."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At three times the hands tom was familiar with most of these points, but occasionally would see a new one that excited his curiosity. However, he was more interested in what Andy Foger had to invent. Andy's machine had not been tried. Tom Warner would only dare risk five minutes.<|im_end|>", 0.03246723860502243, -0.330888032913208, "With three planes behind. Tom was familiar with most of these types, but occasionally he saw a new one that excited his curiosity. However, he was more interested in what andy foger would turn out. Andy's machine had not been tried, and tom wondered how he dared risk flying in it."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At three times to hand tom was familiar with most of these points, but occasionally would see a new one that excited his curiosity. However, he was more interested in what Andy Foger was doing. Andy's machine had not been tried. Tom Warner only dared to whistle five minutes.<|im_end|>", 0.04056717827916145, -0.21970325708389282, "With three planes behind. Tom was familiar with most of these types, but occasionally he saw a new one that excited his curiosity. However, he was more interested in what andy foger would turn out. 
Andy's machine had not been tried, and tom wondered how he dared risk flying in it."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>About three claims to hand tom was familiar with most of these claims, but occasionally would see a new one that excited his curiosity. However, he was more interested in what Andy Foger had to manage andy's machinery had not been tried. Tom Warner only dared risk five minutes.<|im_end|>", 0.03765326738357544, -0.2597014009952545, "With three planes behind. Tom was familiar with most of these types, but occasionally he saw a new one that excited his curiosity. However, he was more interested in what andy foger would turn out. Andy's machine had not been tried, and tom wondered how he dared risk flying in it."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Even had they wished to do it, which remains doubtful. She came behind the wicked grovendam and twisted her neck just as a quick bell of iron dared aspire.<|im_end|>", 0.1723645180463791, -0.36288517713546753, "Even had they wished to do it, which remains doubtful, she came behind the wicked grognon and twisted her neck, just as a cook does a barn door fowl."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Even had they wished to do it, which remains doubtful. 
She came behind the wicked greggong and twisted her neck just as a quick bell of iron gave a sigh.<|im_end|>", 0.09226466715335846, -1.601252555847168, "Even had they wished to do it, which remains doubtful, she came behind the wicked grognon and twisted her neck, just as a cook does a barn door fowl."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Even had they wished to do it, which remains doubtful, she came behind the wicked grovden and twisted her neck just as a quick bell of burning barrel fire.<|im_end|>", 0.27071085572242737, 1.1575783491134644, "Even had they wished to do it, which remains doubtful, she came behind the wicked grognon and twisted her neck, just as a cook does a barn door fowl."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Even had they wished to do it, which remains doubtful, she came behind the wicked grovding and twisted her neck just as a quick bell of iron dare fire.<|im_end|>", 0.27202051877975464, 1.177826166152954, "Even had they wished to do it, which remains doubtful, she came behind the wicked grognon and twisted her neck, just as a cook does a barn door fowl."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Even had they wished to do it, which remains doubtful she came behind the wicked greggion and twisted her neck just as a quick bell of iron dared fire.<|im_end|>", 0.1751171350479126, -0.32032889127731323, "Even had they wished to do it, which remains doubtful, she came behind the wicked grognon and twisted her neck, just as a cook does a barn door fowl."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Even had they wished to do it, which remains doubtful, she came behind the wicked greggion and twisted her neck just 
as a quick bell of burning death died.<|im_end|>", 0.26866206526756287, 1.1259034872055054, "Even had they wished to do it, which remains doubtful, she came behind the wicked grognon and twisted her neck, just as a cook does a barn door fowl."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Even had they wished to do it, which remains doubtful, she came behind the wicked gregg dawn and twisted her neck just as a quick bell of iron dare fire.<|im_end|>", 0.19315652549266815, -0.04143457114696503, "Even had they wished to do it, which remains doubtful, she came behind the wicked grognon and twisted her neck, just as a cook does a barn door fowl."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Even had they wished to do it, which remains doubtful. She came behind the wicked grovendal and twisted her neck just as a quick bell of iron dared fire.<|im_end|>", 0.17351007461547852, -0.34517452120780945, "Even had they wished to do it, which remains doubtful, she came behind the wicked grognon and twisted her neck, just as a cook does a barn door fowl."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Even had they wished to do it, which remains doubtful. She came behind the wicked gregg dawn and twisted her neck just as a quick bell of barren derrick sound.<|im_end|>", 0.09223079681396484, -1.6017762422561646, "Even had they wished to do it, which remains doubtful, she came behind the wicked grognon and twisted her neck, just as a cook does a barn door fowl."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Even had they wished to do it, which remains doubtful. 
She came behind the wicked greggong and twisted her neck just as a quick bell of ironbare fire.<|im_end|>", 0.19122624397277832, -0.07127729803323746, "Even had they wished to do it, which remains doubtful, she came behind the wicked grognon and twisted her neck, just as a cook does a barn door fowl."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Even had they wished to do it, which remains doubtful, she came behind the wicked grogman and twisted her neck just as a quick bell of burning barrel fire.<|im_end|>", 0.2721707224845886, 1.1801483631134033, "Even had they wished to do it, which remains doubtful, she came behind the wicked grognon and twisted her neck, just as a cook does a barn door fowl."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Even had they wished to do it, which remains doubtful. She came behind the wicked grogman and twisted her neck just as a quick bell of iron dared sound.<|im_end|>", 0.17660479247570038, -0.29732927680015564, "Even had they wished to do it, which remains doubtful, she came behind the wicked grognon and twisted her neck, just as a cook does a barn door fowl."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Though just yet none ventured to follow us, it was as though they felt that to do so would be crossing their own line. I wonder whether they might have considered this with any intrepidation or perhaps sullen satisfaction if they had had any chance to reward anybody for following me.<|im_end|>", -0.30214083194732666, -0.016384782269597054, "Though just yet none ventured to follow us. It was as though they felt that to do so was like crossing a dead line. 
I wondered which one of them might be looking at us with inward trepidation, or perhaps satisfaction, if there had been any chance to remove anything incriminating."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Though just yet none ventured to follow us, it was as though they felt that to do so would be crossing their beloved. I wondered whether they might have considered this with any trepidation or perhaps self hatred if they had had any chance to avoid any further trouble.<|im_end|>", -0.24527063965797424, 0.48843005299568176, "Though just yet none ventured to follow us. It was as though they felt that to do so was like crossing a dead line. I wondered which one of them might be looking at us with inward trepidation, or perhaps satisfaction, if there had been any chance to remove anything incriminating."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Though just yet none ventured to follow us, it was as though they felt that to do so would be crossing their beloved I wondered whether they might have acknowledged with any approbation or perhaps satisfaction if they had had any chance to reward anybody for coming.<|im_end|>", -0.18428294360637665, 1.0297943353652954, "Though just yet none ventured to follow us. It was as though they felt that to do so was like crossing a dead line. I wondered which one of them might be looking at us with inward trepidation, or perhaps satisfaction, if there had been any chance to remove anything incriminating."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Though just yet none ventured to follow us, it was as though they felt the security of that crossing had been lost. 
I wondered whether they might have evaded us with any more deliberation or perhaps fast fetched if they had had any chance to avoid anything approaching me.<|im_end|>", -0.40226879715919495, -0.9051822423934937, "Though just yet none ventured to follow us. It was as though they felt that to do so was like crossing a dead line. I wondered which one of them might be looking at us with inward trepidation, or perhaps satisfaction, if there had been any chance to remove anything incriminating."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Though just yet, none ventured to follow us. It was as though they felt it to be folly without crossing the blue line. I wondered whether they might have evaded us with any more preparation, or perhaps fell afresh if they had got any chance to avoid anything before them.<|im_end|>", -0.29436060786247253, 0.052677273750305176, "Though just yet none ventured to follow us. It was as though they felt that to do so was like crossing a dead line. I wondered which one of them might be looking at us with inward trepidation, or perhaps satisfaction, if there had been any chance to remove anything incriminating."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Though just yet, none ventured to follow us. It was as though they felt it to be folly that crossing the blue line. I wondered if even then my little visitors would any more trepidation or perhaps self hatred, if they had but any chance to avoid anything like fear.<|im_end|>", -0.45500248670578003, -1.3732788562774658, "Though just yet none ventured to follow us. It was as though they felt that to do so was like crossing a dead line. 
I wondered which one of them might be looking at us with inward trepidation, or perhaps satisfaction, if there had been any chance to remove anything incriminating."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Though just yet none ventured to follow us, it was as though they felt that to do so would be crossing their beloved. I wondered whether they might have encountered us with any more trepidation or perhaps sarsfetched if they had had any chance to avoid anybody in the crowd.<|im_end|>", -0.23299074172973633, 0.5974339842796326, "Though just yet none ventured to follow us. It was as though they felt that to do so was like crossing a dead line. I wondered which one of them might be looking at us with inward trepidation, or perhaps satisfaction, if there had been any chance to remove anything incriminating."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Though just yet, none ventured to follow us. It was as though they felt that to do so would be crossing their beloved. I wondered whether they might have lived with us in more consideration or perhaps satisfied if they had had any chance to reward anybody for coming.<|im_end|>", -0.2098255306482315, 0.8030626773834229, "Though just yet none ventured to follow us. It was as though they felt that to do so was like crossing a dead line. I wondered which one of them might be looking at us with inward trepidation, or perhaps satisfaction, if there had been any chance to remove anything incriminating."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Though just yet, none ventured to follow us. It was as though they felt it to be far as if crossing forbidden lines. 
I wondered whether they might have evaded us with equal precipitation, or perhaps fast fetched, if they had but any chance to avoid anything from following.<|im_end|>", -0.3078778386116028, -0.06730998307466507, "Though just yet none ventured to follow us. It was as though they felt that to do so was like crossing a dead line. I wondered which one of them might be looking at us with inward trepidation, or perhaps satisfaction, if there had been any chance to remove anything incriminating."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Though just yet, none ventured to follow us. It was as though they felt it would be folly without crossing the blue line. I wondered whether they might have regarded us with any trepidation, or perhaps, self-reproach, if they had had any chance to observe anything of our manner.<|im_end|>", -0.30904507637023926, -0.0776711031794548, "Though just yet none ventured to follow us. It was as though they felt that to do so was like crossing a dead line. I wondered which one of them might be looking at us with inward trepidation, or perhaps satisfaction, if there had been any chance to remove anything incriminating."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Though just yet, none ventured to follow us. It was as though they felt it to be folly to cross over the divide. I wonder whether they might have lived with us any more. Preparation or perhaps self, fetched if they had had any chance to avoid anything from harm.<|im_end|>", -0.5224043726921082, -1.9715795516967773, "Though just yet none ventured to follow us. It was as though they felt that to do so was like crossing a dead line. 
I wondered which one of them might be looking at us with inward trepidation, or perhaps satisfaction, if there had been any chance to remove anything incriminating."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Though just yet none ventured to follow us, it was as though they felt that to do so would be crossing their own line. I wondered whether they might have taken us with any more trepidation or perhaps sarsfetched if they had had any chance to avoid anybody pursuing them.<|im_end|>", -0.13807019591331482, 1.440007209777832, "Though just yet none ventured to follow us. It was as though they felt that to do so was like crossing a dead line. I wondered which one of them might be looking at us with inward trepidation, or perhaps satisfaction, if there had been any chance to remove anything incriminating."]]}
|
wandb/run-20260418_172847-c2a5hfz3/files/media/table/completions_325_dedd0bb2cd2d27e14a92.table.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"columns": ["step", "prompt", "completion", "ASRWerSubLenCmpHalluDirtyV56", "advantages", "solution"], "data": [["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>But that, that's the same old lying doll thing. London is like a port of the sea place of temptation, there's pitfalls for men and traps for money in every turn, as I've heard say.<|im_end|>", -0.4760620892047882, 0.19658391177654266, "But if that's the frame o mind thou'rt in lunnon is like for to be a sore place o temptation. There's pitfalls for men and traps for money at ivery turn. As I've heerd say."], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>But that's the same old lying down I do running is like a port of the sole place of temptation there's pitfalls for men and traps for money in every turn, as I've got said.<|im_end|>", -0.6135305762290955, -0.7280290126800537, "But if that's the frame o mind thou'rt in lunnon is like for to be a sore place o temptation. There's pitfalls for men and traps for money at ivery turn. As I've heerd say."], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>But that that's the same, a lying gal. I think running is likely more to be a safe place of temptation there's pitfalls for men and traps for money in every turn as i've heard say.<|im_end|>", -0.35690099000930786, 0.9980613589286804, "But if that's the frame o mind thou'rt in lunnon is like for to be a sore place o temptation. There's pitfalls for men and traps for money at ivery turn. 
As I've heerd say."], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>But that's the same old lying gallant thing running his life for to be a safe place of temptation, there's pitfalls for men and traps for money in every turn as I've got said.<|im_end|>", -0.3606083393096924, 0.973125696182251, "But if that's the frame o mind thou'rt in lunnon is like for to be a sore place o temptation. There's pitfalls for men and traps for money at ivery turn. As I've heerd say."], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>But if that's the same a lion, thou art in running is like as well to the escape place of temptation, there's pitfalls for men and traps for money in every turn, as I thought fit.<|im_end|>", -0.5472695827484131, -0.2823576331138611, "But if that's the frame o mind thou'rt in lunnon is like for to be a sore place o temptation. There's pitfalls for men and traps for money at ivery turn. As I've heerd say."], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>But that, that's the same old lying doll thing running his life for to be a safe place of temptation. There's pitfalls for men and traps for money in every turn as I've heard said.<|im_end|>", -0.28626200556755066, 1.4731791019439697, "But if that's the frame o mind thou'rt in lunnon is like for to be a sore place o temptation. There's pitfalls for men and traps for money at ivery turn. As I've heerd say."], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>But that's the same old lying gal again. 
London is like a port of the sea, place of temptation, there's pitfalls for money and traps for money in every turn as I've said before.<|im_end|>", -0.6403212547302246, -0.9082230925559998, "But if that's the frame o mind thou'rt in lunnon is like for to be a sore place o temptation. There's pitfalls for men and traps for money at ivery turn. As I've heerd say."], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>But that, that's the same old lion. Thou art in London is like a port to the sea place of temptation. There's pitfalls for men and traps for money in every turn, as I thought fit.<|im_end|>", -0.5447036623954773, -0.26509925723075867, "But if that's the frame o mind thou'rt in lunnon is like for to be a sore place o temptation. There's pitfalls for men and traps for money at ivery turn. As I've heerd say."], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>But if that's the same, a lion bawling running is likely more to be a safe place of temptation there's pitfalls for men and traps for money in every turn as I have said before.<|im_end|>", -0.42995119094848633, 0.5067257881164551, "But if that's the frame o mind thou'rt in lunnon is like for to be a sore place o temptation. There's pitfalls for men and traps for money at ivery turn. As I've heerd say."], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>But if that's the same old lion, thou art in running is like a sport of the ill place of temptation. There's pitfalls for men and traps for money in every turn as I thought said.<|im_end|>", -0.45117539167404175, 0.3639717996120453, "But if that's the frame o mind thou'rt in lunnon is like for to be a sore place o temptation. There's pitfalls for men and traps for money at ivery turn. 
As I've heerd say."], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>But that, that's the same old lying gal up in London is like a port of the sea place of temptation. There's pitfalls for money and traps for money in every turn as I've got to say.<|im_end|>", -0.5213723182678223, -0.10817265510559082, "But if that's the frame o mind thou'rt in lunnon is like for to be a sore place o temptation. There's pitfalls for men and traps for money at ivery turn. As I've heerd say."], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>But that, that's the same old lion gallant thing runnin his life all through this old place of temptation, there's pitfalls for men and traps for men in every turn as I've got said.<|im_end|>", -0.8353171944618225, -2.2197656631469727, "But if that's the frame o mind thou'rt in lunnon is like for to be a sore place o temptation. There's pitfalls for men and traps for money at ivery turn. 
As I've heerd say."], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>i saw but few inhabitants during my excursion and i met a crowd of them actually drying and salting and loading codfish, the principal article of exportation<|im_end|>", 0.450447678565979, 1.2203410863876343, "i saw but few inhabitants during my excursion but i met a crowd on the beach drying salting and loading codfish the principal article of exportation"], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>i saw but few inhabitants during my excursion and i met a crowd of them actually drying and salting and roasting codfish, the principal article of exportation<|im_end|>", 0.34390777349472046, 0.75895094871521, "i saw but few inhabitants during my excursion but i met a crowd on the beach drying salting and loading codfish the principal article of exportation"], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>i saw but few inhabitants during my excursion and i met a crowd of them actually drying and salting and roasting codfish, the principal article of exportation<|im_end|>", 0.34390777349472046, 0.75895094871521, "i saw but few inhabitants during my excursion but i met a crowd on the beach drying salting and loading codfish the principal article of exportation"], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>i saw but few inhabitants during my excursion and i met a crowd of them actually drying and salting and roasting codfish the principal article of exportation<|im_end|>", 0.4490084648132324, 1.2141083478927612, "i saw but few inhabitants during my excursion but i met a crowd on the beach drying salting and loading codfish the principal article of exportation"], ["650", 
"<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>i saw but few inhabitants during my excursion, and i met a crowd of them actually dried and salted in loaded codfish, the principal article of exportation<|im_end|>", -0.09839683026075363, -1.1565287113189697, "i saw but few inhabitants during my excursion but i met a crowd on the beach drying salting and loading codfish the principal article of exportation"], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>i saw but few inhabitants during my excursion and i met a crowd of them actually dried and salted and loaded with codfish, the principal article of exportation<|im_end|>", 0.03567298501729965, -0.5759153366088867, "i saw but few inhabitants during my excursion but i met a crowd on the beach drying salting and loading codfish the principal article of exportation"], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>i saw but few inhabitants during my excursion and i met a crowd of them actually drying and salting and loading codfish, the principal article of exportation<|im_end|>", 0.450447678565979, 1.2203410863876343, "i saw but few inhabitants during my excursion but i met a crowd on the beach drying salting and loading codfish the principal article of exportation"], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>i saw but few inhabitants during my excursion and i met a crowd of them actually dried and salted and loaded in pot dishes the principal article of exportation<|im_end|>", -0.0665484219789505, -1.0186035633087158, "i saw but few inhabitants during my excursion but i met a crowd on the beach drying salting and loading codfish the principal article of exportation"], ["650", 
"<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>i saw but few inhabitants during my excursion and i met a crowd of them actually dried and salted and loaded with codfish, the principal article of exportation<|im_end|>", 0.03567298501729965, -0.5759153366088867, "i saw but few inhabitants during my excursion but i met a crowd on the beach drying salting and loading codfish the principal article of exportation"], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>i saw but few inhabitants during my excursion and i met a crowd of the actually dried and salted and loaded codfish, the principal article of exportation<|im_end|>", 0.23414531350135803, 0.28360486030578613, "i saw but few inhabitants during my excursion but i met a crowd on the beach drying salting and loading codfish the principal article of exportation"], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>i saw but few inhabitants during my excursion and i met a crowd of them actually dried and salted in woven pot dishes the principal article of exportation<|im_end|>", -0.07731880247592926, -1.06524658203125, "i saw but few inhabitants during my excursion but i met a crowd on the beach drying salting and loading codfish the principal article of exportation"], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>i saw but few inhabitants during my excursion and i met a crowd of them actually dried and salted in wooden pot dishes, the principal article of exportation<|im_end|>", -0.07705149054527283, -1.0640889406204224, "i saw but few inhabitants during my excursion but i met a crowd on the beach drying salting and loading codfish the principal article of exportation"], ["650", 
"<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>to allow her to derive encouragement from a preference only given her because her real situation was so different but that it was so probably declared by lucie's eyes on the trump that it was declared over in the next moment more evidently<|im_end|>", 0.18845127522945404, 0.42637088894844055, "or to allow her to derive encouragement from a preference only given her because her real situation was unknown but that it was so had not only been declared by lucy's eyes at the time but was declared over again the next morning more openly"], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>to allow marge and her rival encouragement with a preference only in it because her real situation was a thinner one, but that it was so probably been declared by lucy's eyes on the trumpet that it was declared over again next morning more evidently<|im_end|>", -0.10559716075658798, -1.9492686986923218, "or to allow her to derive encouragement from a preference only given her because her real situation was unknown but that it was so had not only been declared by lucy's eyes at the time but was declared over again the next morning more openly"], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>to allow her to derive encouragement from a preference only in her because her real situation was so different but that it was so probably been declared by lucy's eyes on the trump, that it was declared over again next morning more evidently<|im_end|>", 0.3131347894668579, 1.4336984157562256, "or to allow her to derive encouragement from a preference only given her because her real situation was unknown but that it was so had not only been declared by lucy's eyes at the time but was declared over again the next morning more openly"], 
["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>to allow her to derive encouragement from a preference, only in her because her real situation was so different, but that it was so probably been declared by lucy's eyes on the triumph, that it was declared over again next morning more evidently<|im_end|>", 0.2516788840293884, 0.9371914863586426, "or to allow her to derive encouragement from a preference only given her because her real situation was unknown but that it was so had not only been declared by lucy's eyes at the time but was declared over again the next morning more openly"], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>to allow her to derive encouragement from a preference only in her because her own situation was so different but that it was so probably been declared by lucas eyes on the trumpet that it was declared over and over again more evidently<|im_end|>", 0.00036666117375716567, -1.0931788682937622, "or to allow her to derive encouragement from a preference only given her because her real situation was unknown but that it was so had not only been declared by lucy's eyes at the time but was declared over again the next morning more openly"], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>to allow her to derive encouragement from a preference only given her because her good situation was limited, but that it was so probably been declared by lucas eyes on the trump, that it was declared over in the next moment more evidently<|im_end|>", 0.2317005693912506, 0.7757852077484131, "or to allow her to derive encouragement from a preference only given her because her real situation was unknown but that it was so had not only been declared by lucy's eyes at the time but was declared over again the next morning more openly"], 
["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>to allow her to derive encouragement from a preference only in her because her real situation was so different but that it was so probably been declared by lucy's eyes on the triumph then was declared over and an excellent evening more evident<|im_end|>", 0.17100711166858673, 0.2854381799697876, "or to allow her to derive encouragement from a preference only given her because her real situation was unknown but that it was so had not only been declared by lucy's eyes at the time but was declared over again the next morning more openly"], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>to allow her to derive encouragement from a preference only given her because her own situation was so thin but that it was so probably declared by lucy's eyes on trump that it was declared over in an excellent and warm oven.<|im_end|>", -0.01022692583501339, -1.1787652969360352, "or to allow her to derive encouragement from a preference only given her because her real situation was unknown but that it was so had not only been declared by lucy's eyes at the time but was declared over again the next morning more openly"], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>to allow her to derive encouragement from a preference only in her because her good situation was slender but that it was so probably been declared by lucas eyes on the trump then was declared over and annexed to even more evidently<|im_end|>", 0.09647921472787857, -0.31667831540107727, "or to allow her to derive encouragement from a preference only given her because her real situation was unknown but that it was so had not only been declared by lucy's eyes at the time but was declared over again the next morning more openly"], ["650", 
"<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>to allow her to derive encouragement from a preference, only in her because her own situation was so limited, but that it was so probably been declared by lucy's eyes on the trump, and was declared over again next morning more evidently<|im_end|>", 0.23830121755599976, 0.8291123509407043, "or to allow her to derive encouragement from a preference only given her because her real situation was unknown but that it was so had not only been declared by lucy's eyes at the time but was declared over again the next morning more openly"], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>to allow her to derive encouragement from a preference only in her because her real situation was so thin but that it was so probably been declared by lucy's eyes on the truant that it was declared over evident and explained more evidently<|im_end|>", 0.12768252193927765, -0.06458445638418198, "or to allow her to derive encouragement from a preference only given her because her real situation was unknown but that it was so had not only been declared by lucy's eyes at the time but was declared over again the next morning more openly"], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>to allow her to derive encouragement from a preference only in her because her real situation was so different but that it was so probably been declared by lucy's eyes on the trumpet, that it was declared over and an excellently more evidently<|im_end|>", 0.12514056265354156, -0.08512113988399506, "or to allow her to derive encouragement from a preference only given her because her real situation was unknown but that it was so had not only been declared by lucy's eyes at the time but was declared over again the next morning more openly"], ["650", 
"<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>In a very short time, you would have laughed to a song if I saw yesterday Emmett did not know whether she was on her head or heels in such a hurry to tell him great news.<|im_end|>", 0.44709184765815735, -1.250040054321289, "In a very short time. You would have laughed to have seen what I saw yesterday. Emma did not know whether she was on her head or heels. In such a hurry to tell your great news."], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>In a very short time, you would have laughed to your sin if I saw yesterday Emmet did not know whether she was on her head or hands in such a hurry to tell you great news.<|im_end|>", 0.4470624029636383, -1.2503377199172974, "In a very short time. You would have laughed to have seen what I saw yesterday. Emma did not know whether she was on her head or heels. In such a hurry to tell your great news."], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>In a very short time you would have laughed to your sin if I saw yesterday Emmet did not know whether she was on her head or heels in such a hurry to tell you great news.<|im_end|>", 0.4515860378742218, -1.2046061754226685, "In a very short time. You would have laughed to have seen what I saw yesterday. Emma did not know whether she was on her head or heels. In such a hurry to tell your great news."], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>In a very short time, you would have laughed to see what I saw yesterday. Emmett did not know whether she was on her head or heels in such a hurry to tell your great news.<|im_end|>", 0.6924002766609192, 1.229895830154419, "In a very short time. 
You would have laughed to have seen what I saw yesterday. Emma did not know whether she was on her head or heels. In such a hurry to tell your great news."], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>In a very short time, you would have laughed to your sin that I saw yesterday. Emmet did not know whether she was on her head or thumbs in such a hurry to tell you great news.<|im_end|>", 0.5242686867713928, -0.4698238670825958, "In a very short time. You would have laughed to have seen what I saw yesterday. Emma did not know whether she was on her head or heels. In such a hurry to tell your great news."], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>In a very short time, you would have laughed to see what I saw yesterday. Emmet did not know whether she was on her head or heels in such a hurry to tell him great news.<|im_end|>", 0.6197176575660706, 0.4951137602329254, "In a very short time. You would have laughed to have seen what I saw yesterday. Emma did not know whether she was on her head or heels. In such a hurry to tell your great news."], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>In a very short time, you would have laughed to hear some of how I saw yesterday. Emmet did not know whether she was on her head or heels in such a hurry to tell your great news.<|im_end|>", 0.5412817597389221, -0.29783087968826294, "In a very short time. You would have laughed to have seen what I saw yesterday. Emma did not know whether she was on her head or heels. In such a hurry to tell your great news."], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>In a very short time, you would have laughed to listen to what I saw yesterday. 
Emmet did not know whether she was on her head or thumbs in such a hurry to tell your great news.<|im_end|>", 0.6698590517044067, 1.0020161867141724, "In a very short time. You would have laughed to have seen what I saw yesterday. Emma did not know whether she was on her head or heels. In such a hurry to tell your great news."], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>In a very short time, you would have laughed to your sin that I saw yesterday. Emmett did not know whether she was on her head or heels in such a hurry to tell him great news.<|im_end|>", 0.52790766954422, -0.4330357015132904, "In a very short time. You would have laughed to have seen what I saw yesterday. Emma did not know whether she was on her head or heels. In such a hurry to tell your great news."], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>In a very short time, you would have laughed to see what I saw yesterday. Emmet did not know whether she was on her head or heels in such a hurry to tell your great news.<|im_end|>", 0.693012535572052, 1.2360854148864746, "In a very short time. You would have laughed to have seen what I saw yesterday. Emma did not know whether she was on her head or heels. In such a hurry to tell your great news."], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>In a very short time, you would have laughed to see what I saw yesterday. Emmet did not know whether she was on her head or heels in such a hurry to tell your great news.<|im_end|>", 0.693012535572052, 1.2360854148864746, "In a very short time. You would have laughed to have seen what I saw yesterday. Emma did not know whether she was on her head or heels. 
In such a hurry to tell your great news."], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>In a very short time, you would have laughed to a sing of how I saw yesterday. Emmet did not know whether she was on her head or heels in such a hurry to tell your great news.<|im_end|>", 0.5417073369026184, -0.2935284972190857, "In a very short time. You would have laughed to have seen what I saw yesterday. Emma did not know whether she was on her head or heels. In such a hurry to tell your great news."]]}
|
wandb/run-20260418_172847-c2a5hfz3/files/media/table/completions_331_10c4aed0f625c56bd04d.table.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"columns": ["step", "prompt", "completion", "ASRWerSubLenCmpHalluDirtyV56", "advantages", "solution"], "data": [["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Captain marking, it's about about my wife. Polly answered, casting down her eyes and returning very red. The other gave a whistle.<|im_end|>", 0.5489940643310547, 0.10889305174350739, "Captain marker, it's about about my wife. Crawley answered, casting down his eyes and turning very red. The other gave a whistle."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Captain marten, it's about about my wife. Crawley answered, casting down his eyes and returning a very red. The other gave a whistle.<|im_end|>", 0.7004733681678772, 1.3730005025863647, "Captain marker, it's about about my wife. Crawley answered, casting down his eyes and turning very red. The other gave a whistle."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Captain marten, it's about about my wife. Crawley answered, casting down his eyes and returning a very red. The other day, the whistle.<|im_end|>", 0.4469512701034546, -0.7426625490188599, "Captain marker, it's about about my wife. Crawley answered, casting down his eyes and turning very red. The other gave a whistle."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Captain markham, it's about about my wife. Crawley answered, casting down his eyes and returning a very red. The other day, the whistle.<|im_end|>", 0.44736266136169434, -0.7392294406890869, "Captain marker, it's about about my wife. Crawley answered, casting down his eyes and turning very red. 
The other gave a whistle."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At evening upon the world, while others hint that knowledge of these might undo our civilization, there watched him ceaselessly from the underpits those eyes whose duty it is, from further within and deeper.<|im_end|>", 0.8165187239646912, -1.213279128074646, "At evening upon the world, while others hint that knowledge of these might undo our civilization, there watched him ceaselessly from the under pits, those eyes whose duty it is from further within and deeper."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At evening upon the world, while others hint that knowledge of these might undo our civilization, there watched him ceaselessly from the under pits those eyes whose duty it is from further within and deeper.<|im_end|>", 0.9336058497428894, 1.213279128074646, "At evening upon the world, while others hint that knowledge of these might undo our civilization, there watched him ceaselessly from the under pits, those eyes whose duty it is from further within and deeper."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At evening upon the world, while others hint that knowledge of these might undo our civilization, there watched him ceaselessly from the underpits those eyes whose duty it is from further within and deeper.<|im_end|>", 0.8821772933006287, 0.14745411276817322, "At evening upon the world, while others hint that knowledge of these might undo our civilization, there watched him ceaselessly from the under pits, those eyes whose duty it is from further within and deeper."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At evening upon the world, while others hint that 
knowledge of these might undo our civilization, there watched him ceaselessly from the under pits those eyes whose duty it is, from further within and deeper.<|im_end|>", 0.8679472804069519, -0.14745411276817322, "At evening upon the world, while others hint that knowledge of these might undo our civilization, there watched him ceaselessly from the under pits, those eyes whose duty it is from further within and deeper."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Milly steered her magnificent way like some great liner cleaving among the canoes of howling savages. Our goddess of grub was built on lines so majestic that they could be followed only with awe.<|im_end|>", 1.0, 0.0, "Milly steered her magnificent way like some great liner cleaving among the canoes of howling savages. Our goddess of grub was built on lines so majestic that they could be followed only with awe."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Milly steered her magnificent way like some great liner cleaving among the canoes of howling savages. Our goddess of grub was built on lines so majestic that they could be followed only with awe.<|im_end|>", 1.0, 0.0, "Milly steered her magnificent way like some great liner cleaving among the canoes of howling savages. Our goddess of grub was built on lines so majestic that they could be followed only with awe."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Milly steered her magnificent way like some great liner cleaving among the canoes of howling savages. Our goddess of grub was built on lines so majestic that they could be followed only with awe.<|im_end|>", 1.0, 0.0, "Milly steered her magnificent way like some great liner cleaving among the canoes of howling savages. 
Our goddess of grub was built on lines so majestic that they could be followed only with awe."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Milly steered her magnificent way like some great liner cleaving among the canoes of howling savages. Our goddess of grub was built on lines so majestic that they could be followed only with awe.<|im_end|>", 1.0, 0.0, "Milly steered her magnificent way like some great liner cleaving among the canoes of howling savages. Our goddess of grub was built on lines so majestic that they could be followed only with awe."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And make properly lavish time after working hard, it is not improbable that glossy buttons are a valid feature of the garb of a humdrum and harassed hospital portmanteau many intellect.<|im_end|>", 0.26788923144340515, -1.226920247077942, "And may properly lavish time and trouble thereupon. It is not arguable that glossy buttons are a valid feature of the garb of a humdrum and harassed hospital, orderly many a time."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And may properly lavish time and sport upon it is not improbable that glossy buttons are a valid feature of the garb of a humdrum and harassed hospital superintendent many intellect<|im_end|>", 0.4479951858520508, 1.2192050218582153, "And may properly lavish time and trouble thereupon. It is not arguable that glossy buttons are a valid feature of the garb of a humdrum and harassed hospital, orderly many a time."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And may properly lavish time after working hard. 
It is not improbable that glossy buttons are a valid feature of the garb of a humdrum and harassed hospital employee many intellect.<|im_end|>", 0.35821354389190674, -0.00017242900503333658, "And may properly lavish time and trouble thereupon. It is not arguable that glossy buttons are a valid feature of the garb of a humdrum and harassed hospital, orderly many a time."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And may properly lavish time and sport upon it is not improbable that glossy buttons are a valid feature of the garb of a humdrum and grassy hospital porter many intellect.<|im_end|>", 0.35880690813064575, 0.007886400446295738, "And may properly lavish time and trouble thereupon. It is not arguable that glossy buttons are a valid feature of the garb of a humdrum and harassed hospital, orderly many a time."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And Shahrazad perceived the dawn of day and ceased saying her permitted say, when it was the six hundred and seventy seventh night she pursued, it hath reached me o auspicious king that when the kafirs fell upon harib.<|im_end|>", 0.6396347880363464, 0.0463232584297657, "And shahrazad perceived the dawn of day and ceased saying her permitted say. When it was the six hundred and seventy seventh night, she pursued it. 
Hath reached me o auspicious king, that when the kafirs fell upon gharib."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And Shahrazad perceived the dawn of day and ceased saying her permitted say, when it was the six hundred and seventy seventh night she pursued, it hath reached me o auspicious king that when the kaffirs fell upon harib.<|im_end|>", 0.5678775310516357, -1.2670694589614868, "And shahrazad perceived the dawn of day and ceased saying her permitted say. When it was the six hundred and seventy seventh night, she pursued it. Hath reached me o auspicious king, that when the kafirs fell upon gharib."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And Shahrazad perceived the dawn of day and ceased saying her permitted say, when it was the six hundred and seventy seventh night, she pursued. It hath reached me, O auspicious king, that when the kafirs fell upon Harib.<|im_end|>", 0.7012686133384705, 1.1744240522384644, "And shahrazad perceived the dawn of day and ceased saying her permitted say. When it was the six hundred and seventy seventh night, she pursued it. Hath reached me o auspicious king, that when the kafirs fell upon gharib."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And Shahrazad perceived the dawn of day and ceased saying her permitted say, when it was the six hundred and seventy seventh night she pursued. It hath reached me o auspicious king that when the kafirs fell upon harib.<|im_end|>", 0.6396347880363464, 0.0463232584297657, "And shahrazad perceived the dawn of day and ceased saying her permitted say. When it was the six hundred and seventy seventh night, she pursued it. 
Hath reached me o auspicious king, that when the kafirs fell upon gharib."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>these he would make reply but was from a certain person whom perhaps we need not name then the whiskey bottle would move forward like a pawn in chess and the next soothing words would be<|im_end|>", 0.8178245425224304, 0.502872109413147, "deasey would make reply but twas from a certain person whom perhaps we need not name then the whiskey bottle would move forward like a pawn in chess and the next soothing words would be"], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>beasy would make reply but was from a certain person whom perhaps we need not name then the whiskey bottle would move forward like a pawn in chess and the next soothing words would be<|im_end|>", 0.8717525601387024, 0.8038002252578735, "deasey would make reply but twas from a certain person whom perhaps we need not name then the whiskey bottle would move forward like a pawn in chess and the next soothing words would be"], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>these he would make reply but was from a certain person whom perhaps we need not name then the whiskey bottle would move forward like upon in chest and the next soothing words repeat<|im_end|>", 0.4692924916744232, -1.4420000314712524, "deasey would make reply but twas from a certain person whom perhaps we need not name then the whiskey bottle would move forward like a pawn in chess and the next soothing words would be"], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>these he would make reply but was from a certain person whom perhaps we need not name then the whiskey bottle would move forward like a pawn in 
chess and the next suiting words would be<|im_end|>", 0.7519586086273193, 0.13532821834087372, "deasey would make reply but twas from a certain person whom perhaps we need not name then the whiskey bottle would move forward like a pawn in chess and the next soothing words would be"], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He did, in fact, begin it when setting out on the aforementioned second trip to Europe, calling it.<|im_end|>", 1.0, 0.49922850728034973, "He did, in fact, begin it when setting out on the aforementioned second trip to europe, calling it."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He did, in fact, begin it when setting out on the aforementioned second trip to Europe, calling it.<|im_end|>", 1.0, 0.49922850728034973, "He did, in fact, begin it when setting out on the aforementioned second trip to europe, calling it."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He did, in fact, begin it when setting out on the aforementioned second trip to Europe, calling it.<|im_end|>", 1.0, 0.49922850728034973, "He did, in fact, begin it when setting out on the aforementioned second trip to europe, calling it."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He did, in fact begin it when setting out on the aforementioned second trip to Europe, calling it.<|im_end|>", 0.8706542253494263, -1.4976837635040283, "He did, in fact, begin it when setting out on the aforementioned second trip to europe, calling it."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Bayard knew that his master was upon him, and he started off upon a rapid pace. 
And in a few moments, he had good run up. Malagigi pretended to be in great alarm. O noble king and master, he cried, my poor companion has run away with. He will fall and break his neck.<|im_end|>", 0.4922104775905609, -0.6293519735336304, "Bayard knew that his master was upon him, and he started off upon a rapid pace, and in a few moments was a good way off. Malagigi pretended to be in great alarm o, noble king and master. He cried, my poor companion is run away with he will fall and break his neck."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Bayard knew that his master was upon him, and he started off upon a rapid pace. And in a few moments, he had galloped away. Malagigi pretended to be in great alarm. O noble king and master, he cried, my poor companion has run away with me. He will fall and break his neck.<|im_end|>", 0.4565129280090332, -1.024836540222168, "Bayard knew that his master was upon him, and he started off upon a rapid pace, and in a few moments was a good way off. Malagigi pretended to be in great alarm o, noble king and master. He cried, my poor companion is run away with he will fall and break his neck."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Bayard knew that his master was upon him, and he started off upon a rapid pace. And in a few moments of a good way up. Malagigi pretended to be in great alarm. O noble king and master, he cried, my poor companion has run away with. He will fall and break his neck.<|im_end|>", 0.6506629586219788, 1.1261051893234253, "Bayard knew that his master was upon him, and he started off upon a rapid pace, and in a few moments was a good way off. Malagigi pretended to be in great alarm o, noble king and master. 
He cried, my poor companion is run away with he will fall and break his neck."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Bayard knew that his master was upon him, and he started off upon a rapid pace. And in a few moments of a good run up, Malagigi pretended to be in great alarm. O noble king and master, he cried, my poor companion has run away with. He will fall and break his neck.<|im_end|>", 0.5966837406158447, 0.5280823707580566, "Bayard knew that his master was upon him, and he started off upon a rapid pace, and in a few moments was a good way off. Malagigi pretended to be in great alarm o, noble king and master. He cried, my poor companion is run away with he will fall and break his neck."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>She laid a firm, delicate hand on her gold green jerkin. Ellador, this was pleasant, but we got no nearer. We can't sit here and learn the language. Terry protested.<|im_end|>", 1.0, 1.3054163455963135, "She laid a firm, delicate hand on her gold green jerkin. Ellador, this was pleasant, but we got no nearer. We can't sit here and learn the language. Terry protested."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>She laid a firm, delicate hand on her gold green jerkin ellador. This was pleasant, but we got no nearer. We can't sit here and learn the language. Terry protested.<|im_end|>", 0.8441234230995178, -0.7815061807632446, "She laid a firm, delicate hand on her gold green jerkin. Ellador, this was pleasant, but we got no nearer. We can't sit here and learn the language. Terry protested."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>She laid a firm, delicate hand on her gold green jerkin. Ellador. 
This was pleasant, but we got no nearer. We can't sit here and learn the language. Terry protested.<|im_end|>", 0.9217362999916077, 0.2575983703136444, "She laid a firm, delicate hand on her gold green jerkin. Ellador, this was pleasant, but we got no nearer. We can't sit here and learn the language. Terry protested."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>She laid a firm, delicate hand on her gold green jerkin ellador. This was pleasant, but we got no nearer. We can't sit here and learn the language. Terry protested.<|im_end|>", 0.8441234230995178, -0.7815061807632446, "She laid a firm, delicate hand on her gold green jerkin. Ellador, this was pleasant, but we got no nearer. We can't sit here and learn the language. Terry protested."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>he cried out sadly and fought and struggled two minutes however he did little against his tormentors and worn out with his struggle plats suddenly went from dusty boy with emotion in his spirit lost lost he muttered all lost<|im_end|>", -0.15980112552642822, -0.0070180995389819145, "he cried out savagely and fought with the strength of two men however he could do little against his four adversaries and worn out with the struggle collapsed suddenly on to the dusty floor with a motion of despair lost lost he muttered all lost"], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>he cried out sadly and fought and struggled two minutes however he did little against his tormentors and worn out with his struggle platt suddenly on the dusty floor with emotion in his spirit lost lost he muttered all lost<|im_end|>", 0.03230888023972511, 0.7638584971427917, "he cried out savagely and fought with the strength of two men however he could do little against his four 
adversaries and worn out with the struggle collapsed suddenly on to the dusty floor with a motion of despair lost lost he muttered all lost"], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>he cried out sadly and fought and struggled to win it however he did little against his tormentors and wore down with his struggle plaid suddenly went from dusty boy with emotion in his spirit lost, lost, he muttered all lost<|im_end|>", -0.5093984603881836, -1.409841537475586, "he cried out savagely and fought with the strength of two men however he could do little against his four adversaries and worn out with the struggle collapsed suddenly on to the dusty floor with a motion of despair lost lost he muttered all lost"], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>he cried out sadly and fought and struggled two minutes however he did little against four adversaries and worn out with his struggle clapp suddenly on the dusty floor in motionless terror lost lost he muttered all lost<|im_end|>", 0.004682107362896204, 0.653001070022583, "he cried out savagely and fought with the strength of two men however he could do little against his four adversaries and worn out with the struggle collapsed suddenly on to the dusty floor with a motion of despair lost lost he muttered all lost"], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>and thus he accomplished this by the bye during the siege of the city, for he had his enemies in great contempt already nine when he had thus married mariamne.<|im_end|>", 0.715508222579956, 0.49875012040138245, "And thus he accomplished this by the by, during the siege of the city. 
For he had his enemies in great contempt already nine when he had thus married mariamne, he."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>and thus he accomplished this by the bye during the siege of the city, for he had his enemies in great contempt already nine when he had thus married mariamne.<|im_end|>", 0.715508222579956, 0.49875012040138245, "And thus he accomplished this by the by, during the siege of the city. For he had his enemies in great contempt already nine when he had thus married mariamne, he."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And thus he accomplished this by the bye during the siege of the city, for he had his enemies in great contempt already. Nine when he had thus married Mariamne.<|im_end|>", 0.6356512308120728, -1.4962533712387085, "And thus he accomplished this by the by, during the siege of the city. For he had his enemies in great contempt already nine when he had thus married mariamne, he."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>and thus he accomplished this by the bye during the siege of the city, for he had his enemies in great contempt already nine when he had thus married mariamne.<|im_end|>", 0.715508222579956, 0.49875012040138245, "And thus he accomplished this by the by, during the siege of the city. For he had his enemies in great contempt already nine when he had thus married mariamne, he."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Putting both hands on her shoulders and looking into the brown eyes, should you be willing to go abroad with your mother and phronsie? 
Mister king and jasper oh polly gasped but you.<|im_end|>", 0.7173033952713013, -0.7722386121749878, "Putting both hands on her shoulders and looking into the brown eyes, should you be willing to go abroad with your mother and phronsie, mister king and jasper? Oh, polly gasped, but you."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Putting both hands on her shoulders and looking into the brown eyes, should you be willing to go abroad with your mother and phronsie? Mister king and jasper. Oh Polly gasped. But you.<|im_end|>", 0.7161594033241272, -0.7890278100967407, "Putting both hands on her shoulders and looking into the brown eyes, should you be willing to go abroad with your mother and phronsie, mister king and jasper? Oh, polly gasped, but you."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Putting both hands on her shoulders and looking into the brown eyes, should you be willing to go abroad with your mother and phronsie? Mister king and jasper. Oh Polly gasped, but you.<|im_end|>", 0.7872677445411682, 0.25455793738365173, "Putting both hands on her shoulders and looking into the brown eyes, should you be willing to go abroad with your mother and phronsie, mister king and jasper? Oh, polly gasped, but you."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Putting both hands on her shoulders and looking into the brown eyes, should you be willing to go abroad with your mother and phronsie, mister king and jasper? Oh Polly gasped but you.<|im_end|>", 0.8589596152305603, 1.3067076206207275, "Putting both hands on her shoulders and looking into the brown eyes, should you be willing to go abroad with your mother and phronsie, mister king and jasper? Oh, polly gasped, but you."]]}
|
wandb/run-20260418_172847-c2a5hfz3/files/media/table/completions_335_3461640c297d6819a123.table.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"columns": ["step", "prompt", "completion", "ASRWerSubLenCmpHalluDirtyV56", "advantages", "solution"], "data": [["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Are any other beings ever found in such masses but armor, anus, scaly and naked? Look at them.<|im_end|>", 0.10128102451562881, 0.9727044701576233, "Are any other beings ever found in such masses? But vermin, aimless, staring, vacant minded. Look at them."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Are any other beings ever found in such masses of iron, anus, stone and great granite? Look at them.<|im_end|>", -0.21537110209465027, -0.9686115980148315, "Are any other beings ever found in such masses? But vermin, aimless, staring, vacant minded. Look at them."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Are any other beings ever found in such masses but armor, anus, scale and great and round? Look at them.<|im_end|>", -0.17419415712356567, -0.7161659002304077, "Are any other beings ever found in such masses? But vermin, aimless, staring, vacant minded. Look at them."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Are any other beings ever found in such masses but iron, a mis, stone? Great and grand. Look at them.<|im_end|>", -0.16917581856250763, -0.6853997111320496, "Are any other beings ever found in such masses? But vermin, aimless, staring, vacant minded. Look at them."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Are any other beings ever found in such masses of iron, anus, stone and great granite? 
Look at them.<|im_end|>", -0.21537110209465027, -0.9686115980148315, "Are any other beings ever found in such masses? But vermin, aimless, staring, vacant minded. Look at them."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Are any other beings ever found in such masses, but armor? Anus, scaly and naked. Look at them.<|im_end|>", 0.10200562328100204, 0.9771468043327332, "Are any other beings ever found in such masses? But vermin, aimless, staring, vacant minded. Look at them."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Are any other beings ever found in such masses, but armor, anus, scale and great and round it? Look at them.<|im_end|>", -0.35615864396095276, -1.8317453861236572, "Are any other beings ever found in such masses? But vermin, aimless, staring, vacant minded. Look at them."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Are any other beings ever found in such masses but armor, anus, scaly and naked? Look at them.<|im_end|>", 0.10128102451562881, 0.9727044701576233, "Are any other beings ever found in such masses? But vermin, aimless, staring, vacant minded. Look at them."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Are any other beings ever found in such masses but armor, anus, stamen and great gland? Look at them.<|im_end|>", -0.035287097096443176, 0.13543902337551117, "Are any other beings ever found in such masses? But vermin, aimless, staring, vacant minded. Look at them."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Are any other beings ever found in such masses but armor, anus, scaly and naked minded? 
Look at them.<|im_end|>", -0.028729775920510292, 0.17564034461975098, "Are any other beings ever found in such masses? But vermin, aimless, staring, vacant minded. Look at them."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Are any other beings ever found in such masses but armor anus, scaly and naked? Look at them.<|im_end|>", 0.09989295154809952, 0.9641945362091064, "Are any other beings ever found in such masses? But vermin, aimless, staring, vacant minded. Look at them."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Are any other beings ever found in such masses but armor, anus, scaly and naked? Look at them.<|im_end|>", 0.10128102451562881, 0.9727044701576233, "Are any other beings ever found in such masses? But vermin, aimless, staring, vacant minded. Look at them."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>in which both of them seated without either audience for nothing had been said on either side between them to slight each other less than they had done before and elizabeth asked her parting with a melancholy persuasion that edward was not only without affection for the person who was to be his bride<|im_end|>", 0.2575233578681946, 0.4609338343143463, "to which both of them submitted without any reluctance for nothing had been said on either side to make them dislike each other less than they had done before and elinor sat down to the card table with the melancholy persuasion that edward was not only without affection for the person who was to be his wife"], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>in which both of them seated without either audience for nothing it could be said on either side that they disliked each other less than 
they had done before and elizabeth asked for parting with a melancholy persuasion that edward was not only without affection for the person who was to be his bride<|im_end|>", 0.1251828372478485, -1.8440135717391968, "to which both of them submitted without any reluctance for nothing had been said on either side to make them dislike each other less than they had done before and elinor sat down to the card table with the melancholy persuasion that edward was not only without affection for the person who was to be his wife"], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>in which both of them seated without either audience for nothing it can say on either side had made them dislike each other less than they had done before and elizabeth asked her partake with a melancholy persuasion that edward was not only without affection for the person who was his wife<|im_end|>", 0.17267856001853943, -1.0167903900146484, "to which both of them submitted without any reluctance for nothing had been said on either side to make them dislike each other less than they had done before and elinor sat down to the card table with the melancholy persuasion that edward was not only without affection for the person who was to be his wife"], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>in which both of them sitted without either utterance for nothing had been said on either side except from dislike each other less than they had done before and elizabeth asked her partaker with a melancholy persuasion that edward was not only without affection for the person who was speaking his mind<|im_end|>", 0.21673797070980072, -0.249416783452034, "to which both of them submitted without any reluctance for nothing had been said on either side to make them dislike each other less than they had done before and elinor sat down to the card table with the 
melancholy persuasion that edward was not only without affection for the person who was to be his wife"], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>in which both of them seated without either audience for nothing had been said on either side except from dislike each other less than they had done before and elizabeth asked her parting with a melancholy persuasion that edward was not only without affection for the person who was his wife<|im_end|>", 0.26496413350105286, 0.5905282497406006, "to which both of them submitted without any reluctance for nothing had been said on either side to make them dislike each other less than they had done before and elinor sat down to the card table with the melancholy persuasion that edward was not only without affection for the person who was to be his wife"], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>in which both of them seated without either audience for nothing it could said on either side made them dislike each other less than they had done before and elizabeth asked for parting with a melancholy persuasion that edward was not only without affection for the person who was to be his bride<|im_end|>", 0.26157763600349426, 0.5315463542938232, "to which both of them submitted without any reluctance for nothing had been said on either side to make them dislike each other less than they had done before and elinor sat down to the card table with the melancholy persuasion that edward was not only without affection for the person who was to be his wife"], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>in which both of them seated without either audience for nothing it had said on either side made them dislike each other less than they had done before and elizabeth asked her partaking with a 
melancholy persuasion that edward was not only without affection for the person who was to be his bride<|im_end|>", 0.26304858922958374, 0.5571656227111816, "to which both of them submitted without any reluctance for nothing had been said on either side to make them dislike each other less than they had done before and elinor sat down to the card table with the melancholy persuasion that edward was not only without affection for the person who was to be his wife"], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>in which both of them succeeded without either arguments for nothing it had said on either side could make them dislike each other less than they had done before and elizabeth asked her parting with a melancholy resiliation that edward was not only without affection for the person who was keeping his mind<|im_end|>", 0.1625610888004303, -1.1930042505264282, "to which both of them submitted without any reluctance for nothing had been said on either side to make them dislike each other less than they had done before and elinor sat down to the card table with the melancholy persuasion that edward was not only without affection for the person who was to be his wife"], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>in which both of them seated without either audience for nothing had been said on either side except in dislike each other less than they had done before and elizabeth asked her partake with a melancholy persuasion that edward was not only without affection for the person who was to be his bride<|im_end|>", 0.30962347984313965, 1.368350863456726, "to which both of them submitted without any reluctance for nothing had been said on either side to make them dislike each other less than they had done before and elinor sat down to the card table with the melancholy persuasion that edward was not only 
without affection for the person who was to be his wife"], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>in which both of them sitted without either audience for nothing had been said on either side except what was like each other less than they had done before and elizabeth asked her partaking with a melancholy persuasion that edward was not only without affection for the person who was his wife<|im_end|>", 0.21824409067630768, -0.2231850028038025, "to which both of them submitted without any reluctance for nothing had been said on either side to make them dislike each other less than they had done before and elinor sat down to the card table with the melancholy persuasion that edward was not only without affection for the person who was to be his wife"], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>in which both of them seated without either audience for nothing had been said on either side except from dislike each other less than they had done before nelly lost asked to partake with a melancholy persuasion that edward was not only without affection for the person who was to be his bride<|im_end|>", 0.30912715196609497, 1.3597064018249512, "to which both of them submitted without any reluctance for nothing had been said on either side to make them dislike each other less than they had done before and elinor sat down to the card table with the melancholy persuasion that edward was not only without affection for the person who was to be his wife"], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>in which both of them succeeded without either audience for nothing had been said on either side between the sight each other less than they had done before and elizabeth asked her parting with a melancholy resiliation that edward was not only 
without affection for the person who was to be his bride<|im_end|>", 0.2114323079586029, -0.34182441234588623, "to which both of them submitted without any reluctance for nothing had been said on either side to make them dislike each other less than they had done before and elinor sat down to the card table with the melancholy persuasion that edward was not only without affection for the person who was to be his wife"], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And they've just been ordered a small pot of ginger, then please, said Barbara quickly. Will you send it round immediately? Yes, ma'am. The boy's just going out. Thank you, ma'am.<|im_end|>", 0.4192619323730469, 1.2368416786193848, "And they've just been ordered a small pot of ginger then, please, said diva, recklessly. Will you send it round immediately? Yes, ma'am. The boy's just going out. That was luck."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And they've just been ordered a small pot of ginger, then please. Without a requisition. Will you send it round immediately? Yes, ma'am. The boys just going out. That's what.<|im_end|>", 0.15900462865829468, -0.6233274340629578, "And they've just been ordered a small pot of ginger then, please, said diva, recklessly. Will you send it round immediately? Yes, ma'am. The boy's just going out. That was luck."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And they've just been ordered a small pot of ginger then, please, if I'd rather have it sweet? Will you send it round immediately? Yes, ma'am. The boy's just going out. That'll be about.<|im_end|>", 0.27937445044517517, 0.23700663447380066, "And they've just been ordered a small pot of ginger then, please, said diva, recklessly. Will you send it round immediately? Yes, ma'am. 
The boy's just going out. That was luck."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And they've just been ordered a small pot of ginger, then please, said Datterley softly. Will you send it round immediately? Yes, ma'am. The boys just going out. Thank you, mother.<|im_end|>", 0.32857972383499146, 0.5886975526809692, "And they've just been ordered a small pot of ginger then, please, said diva, recklessly. Will you send it round immediately? Yes, ma'am. The boy's just going out. That was luck."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And that's just been ordered a small pot of ginger, then please, without a requisition. Will you send it round immediately? Yes, ma'am. The boys just going out. That is well.<|im_end|>", 0.22822655737400055, -0.12856899201869965, "And they've just been ordered a small pot of ginger then, please, said diva, recklessly. Will you send it round immediately? Yes, ma'am. The boy's just going out. That was luck."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And they've just been ordered a small pot of ginger, then please. I'd rather have it soon. Will you send it round immediately? Yes, ma'am. The boy's just going out. Thank you, ma'am.<|im_end|>", 0.08186985552310944, -1.1746423244476318, "And they've just been ordered a small pot of ginger then, please, said diva, recklessly. Will you send it round immediately? Yes, ma'am. The boy's just going out. That was luck."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And they've just been ordered a small pot of ginger, then please said datterley quickly. Will you send it round immediately? Yes, ma'am. The boy's just going out. Thank you. 
Well.<|im_end|>", 0.33202850818634033, 0.6133474707603455, "And they've just been ordered a small pot of ginger then, please, said diva, recklessly. Will you send it round immediately? Yes, ma'am. The boy's just going out. That was luck."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And that's just been ordered a small pot of ginger, then please. What about a recipe? Will you send it round immediately? Yes, ma'am. The boys just going out. Thank you. Well.<|im_end|>", -0.03146732226014137, -1.9847110509872437, "And they've just been ordered a small pot of ginger then, please, said diva, recklessly. Will you send it round immediately? Yes, ma'am. The boy's just going out. That was luck."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And they've just been ordered a small pot of ginger, then please if that'll reconcile. Will you send it round immediately? Yes, ma'am. The boy's just going out. Thank you, ma'am.<|im_end|>", 0.23466002941131592, -0.08258624374866486, "And they've just been ordered a small pot of ginger then, please, said diva, recklessly. Will you send it round immediately? Yes, ma'am. The boy's just going out. That was luck."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And that's just been ordered a small pot of ginger, then please without a recipe. Will you send it round immediately? Yes, ma'am. The boy's just going out. Thank you, papa.<|im_end|>", 0.14090721309185028, -0.752677321434021, "And they've just been ordered a small pot of ginger then, please, said diva, recklessly. Will you send it round immediately? Yes, ma'am. The boy's just going out. 
That was luck."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And they've just been ordered a small pot of ginger, then please, said the doctor rapidly. Will you send it round immediately? Yes, ma'am, the boy's just going out. That is well.<|im_end|>", 0.34315091371536255, 0.692844033241272, "And they've just been ordered a small pot of ginger then, please, said diva, recklessly. Will you send it round immediately? Yes, ma'am. The boy's just going out. That was luck."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And they've just been ordered a small pot of ginger, then please, said datterley hastily. Will you send it round immediately? Yes, ma'am. The boy's just going out. That's well.<|im_end|>", 0.4389801323413849, 1.377776026725769, "And they've just been ordered a small pot of ginger then, please, said diva, recklessly. Will you send it round immediately? Yes, ma'am. The boy's just going out. That was luck."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I don't want to be you, for I am not, and yet there is one thing that I forbear to mourn them.<|im_end|>", -1.3294343948364258, -1.4924614429473877, "You don't believe it, do you? Watson, no, no. And yet, it was one thing to laugh about it in london."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He demanded, \"Do you have a hat?\". I had one, and yet there was one thing that I forgot to mention.<|im_end|>", -1.2909154891967773, -1.3791276216506958, "You don't believe it, do you? Watson, no, no. 
And yet, it was one thing to laugh about it in london."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He declared to you, of course, I am here and yet there is one thing to laugh about in London.<|im_end|>", -0.8068205714225769, 0.04522077739238739, "You don't believe it, do you? Watson, no, no. And yet, it was one thing to laugh about it in london."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He did not believe it, and yet there was one thing to laugh about in London.<|im_end|>", -0.3995647430419922, 1.2434861660003662, "You don't believe it, do you? Watson, no, no. And yet, it was one thing to laugh about it in london."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He thought, but he knew of it all, and yet there was one thing to laugh about in London.<|im_end|>", -0.6124812364578247, 0.617023766040802, "You don't believe it, do you? Watson, no, no. And yet, it was one thing to laugh about it in london."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He declared, be you what you will and yet there is one thing to laugh about it in London.<|im_end|>", -0.6049650311470032, 0.6391386389732361, "You don't believe it, do you? Watson, no, no. And yet, it was one thing to laugh about it in london."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He declared to you, he said, I am ill, and yet there is one thing to laugh about in London.<|im_end|>", -0.807164192199707, 0.04420974478125572, "You don't believe it, do you? Watson, no, no. 
And yet, it was one thing to laugh about it in london."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He replied, but do you want to help me in that? And yet there is one thing to laugh about it in London.<|im_end|>", -0.9126564264297485, -0.2661791741847992, "You don't believe it, do you? Watson, no, no. And yet, it was one thing to laugh about it in london."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He had been a victim of hope, and yet there was one thing to laugh about it in London.<|im_end|>", -0.4558258652687073, 1.0779495239257812, "You don't believe it, do you? Watson, no, no. And yet, it was one thing to laugh about it in london."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He complained, but he was hotly in love. And yet there is one thing that I forgot to mention.<|im_end|>", -1.290951132774353, -1.3792325258255005, "You don't believe it, do you? Watson, no, no. And yet, it was one thing to laugh about it in london."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He declared, \"Do you think I am ill? And yet there is one thing to laugh about in London.\"<|im_end|>", -0.9214498996734619, -0.29205214977264404, "You don't believe it, do you? Watson, no, no. And yet, it was one thing to laugh about it in london."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I don't believe you, sir. I know it, and yet there is one thing to laugh about in London.<|im_end|>", -0.434049129486084, 1.1420230865478516, "You don't believe it, do you? Watson, no, no. And yet, it was one thing to laugh about it in london."]]}
|
wandb/run-20260418_172847-c2a5hfz3/files/media/table/completions_411_885808c4b4bd708583eb.table.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"columns": ["step", "prompt", "completion", "ASRWerSubLenCmpHalluDirtyV56", "advantages", "solution"], "data": [["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Captain markham, it's about about my wife. Polly answered, casting down her eyes and returning a very red. The other day, the whistle.<|im_end|>", 0.1822807341814041, -0.6647002696990967, "Captain marker, it's about about my wife. Crawley answered, casting down his eyes and turning very red. The other gave a whistle."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Captain martin, it's about about my wife, crawley answered, casting down his eyes and returning a very red. The other day, the whistle.<|im_end|>", 0.3173089027404785, -0.11428264528512955, "Captain marker, it's about about my wife. Crawley answered, casting down his eyes and turning very red. The other gave a whistle."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Captain marten, it's about about my wife. Crawley answered, casting down his eyes and returning a very red. The other gave a whistle.<|im_end|>", 0.7004733681678772, 1.4476171731948853, "Captain marker, it's about about my wife. Crawley answered, casting down his eyes and turning very red. The other gave a whistle."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Captain martin, it's about about my wife. Polly answered, casting down her eyes and returning a very red. The other day, the whistle.<|im_end|>", 0.1813155859708786, -0.6686345338821411, "Captain marker, it's about about my wife. Crawley answered, casting down his eyes and turning very red. 
The other gave a whistle."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At evening upon the world, while others hint that knowledge of these might undo our civilization. There watched him ceaselessly from the underpits those eyes whose duty it is from further within and deeper.<|im_end|>", 0.8152623176574707, -1.2966564893722534, "At evening upon the world, while others hint that knowledge of these might undo our civilization, there watched him ceaselessly from the under pits, those eyes whose duty it is from further within and deeper."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At evening upon the world, while others hint that knowledge of these might undo our civilization, there watched him ceaselessly from the under pits those eyes whose duty it is from further within and deeper.<|im_end|>", 0.9336058497428894, 1.1373971700668335, "At evening upon the world, while others hint that knowledge of these might undo our civilization, there watched him ceaselessly from the under pits, those eyes whose duty it is from further within and deeper."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At evening upon the world, while others hint that knowledge of these might undo our civilization, there watched him ceaselessly from the underpits those eyes whose duty it is from further within and deeper.<|im_end|>", 0.8821772933006287, 0.0796302929520607, "At evening upon the world, while others hint that knowledge of these might undo our civilization, there watched him ceaselessly from the under pits, those eyes whose duty it is from further within and deeper."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At evening upon the world, while others hint that 
knowledge of these might undo our civilization, there watched him ceaselessly from the underpits those eyes whose duty it is from further within and deeper.<|im_end|>", 0.8821772933006287, 0.0796302929520607, "At evening upon the world, while others hint that knowledge of these might undo our civilization, there watched him ceaselessly from the under pits, those eyes whose duty it is from further within and deeper."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Milly steered her magnificent way like some great liner cleaving among the canoes of howling savages. Our goddess of grub was built on lines so majestic that they could be followed only with awe.<|im_end|>", 1.0, 0.0, "Milly steered her magnificent way like some great liner cleaving among the canoes of howling savages. Our goddess of grub was built on lines so majestic that they could be followed only with awe."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Milly steered her magnificent way like some great liner cleaving among the canoes of howling savages. Our goddess of grub was built on lines so majestic that they could be followed only with awe.<|im_end|>", 1.0, 0.0, "Milly steered her magnificent way like some great liner cleaving among the canoes of howling savages. Our goddess of grub was built on lines so majestic that they could be followed only with awe."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Milly steered her magnificent way like some great liner cleaving among the canoes of howling savages. Our goddess of grub was built on lines so majestic that they could be followed only with awe.<|im_end|>", 1.0, 0.0, "Milly steered her magnificent way like some great liner cleaving among the canoes of howling savages. 
Our goddess of grub was built on lines so majestic that they could be followed only with awe."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Milly steered her magnificent way like some great liner cleaving among the canoes of howling savages. Our goddess of grub was built on lines so majestic that they could be followed only with awe.<|im_end|>", 1.0, 0.0, "Milly steered her magnificent way like some great liner cleaving among the canoes of howling savages. Our goddess of grub was built on lines so majestic that they could be followed only with awe."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And may properly lavish time and store it upon. It is not improbable that glossy buttons are a valid feature of the garb of a humdrum and harassed hospital porter many intellect.<|im_end|>", 0.38166147470474243, 0.8561707735061646, "And may properly lavish time and trouble thereupon. It is not arguable that glossy buttons are a valid feature of the garb of a humdrum and harassed hospital, orderly many a time."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And may properly lavish time and reward him upon it is not improbable that glossy buttons are a valid feature of the garb of a humdrum and grassy hospital porter many intellect.<|im_end|>", 0.2887856066226959, 0.24522322416305542, "And may properly lavish time and trouble thereupon. 
It is not arguable that glossy buttons are a valid feature of the garb of a humdrum and harassed hospital, orderly many a time."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And may properly lavish time and store their money in it is not improbable that glossy buttons are a valid feature of the garb of a humdrum and harassed hospital portmanteau many intellect.<|im_end|>", 0.30360567569732666, 0.3427112400531769, "And may properly lavish time and trouble thereupon. It is not arguable that glossy buttons are a valid feature of the garb of a humdrum and harassed hospital, orderly many a time."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And may properly lavish time at his work of art. It is not improbable that glossy buttons are a valid feature in the garb of a humdrum and grassy hospital wardrobes many intellect.<|im_end|>", 0.031974904239177704, -1.4441053867340088, "And may properly lavish time and trouble thereupon. It is not arguable that glossy buttons are a valid feature of the garb of a humdrum and harassed hospital, orderly many a time."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And shahrazad perceived the dawn of day and ceased saying her permitted say, when it was the six hundred and seventy seventh night she pursued, it hath reached me o auspicious king that when the kafirs fell upon harib.<|im_end|>", 0.6396347880363464, -0.8913764357566833, "And shahrazad perceived the dawn of day and ceased saying her permitted say. When it was the six hundred and seventy seventh night, she pursued it. 
Hath reached me o auspicious king, that when the kafirs fell upon gharib."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And shahrazad perceived the dawn of day and ceased saying her permitted say, when it was the six hundred and seventy seventh night, she pursued it hath reached me o auspicious king that when the kafirs fell upon harib.<|im_end|>", 0.7608726620674133, 1.3088793754577637, "And shahrazad perceived the dawn of day and ceased saying her permitted say. When it was the six hundred and seventy seventh night, she pursued it. Hath reached me o auspicious king, that when the kafirs fell upon gharib."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And shahrazad perceived the dawn of day and ceased saying her permitted say when it was the six hundred and seventy seventh night, she pursued. It hath reached me o auspicious king that when the kafirs fell upon harib.<|im_end|>", 0.7017130255699158, 0.23523521423339844, "And shahrazad perceived the dawn of day and ceased saying her permitted say. When it was the six hundred and seventy seventh night, she pursued it. Hath reached me o auspicious king, that when the kafirs fell upon gharib."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And Shahrazad perceived the dawn of day and ceased saying her permitted say when it was the six hundred seventy seventh night, she pursued it hath reached me o auspicious king that when the kaffirs fell upon harib.<|im_end|>", 0.6527841091156006, -0.6527392268180847, "And shahrazad perceived the dawn of day and ceased saying her permitted say. When it was the six hundred and seventy seventh night, she pursued it. 
Hath reached me o auspicious king, that when the kafirs fell upon gharib."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>these he would make reply but was from a certain person whom perhaps we need not name then the whiskey bottle would move forward like a pawn in chess and the next suited words would be<|im_end|>", 0.74958735704422, 0.16212931275367737, "deasey would make reply but twas from a certain person whom perhaps we need not name then the whiskey bottle would move forward like a pawn in chess and the next soothing words would be"], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>these he would make reply, but was found on a certain person whom perhaps we need not name. Then the whiskey bottle would move forward like a pawn in chess and the next soothing words would be<|im_end|>", 0.5462133884429932, -1.4572458267211914, "deasey would make reply but twas from a certain person whom perhaps we need not name then the whiskey bottle would move forward like a pawn in chess and the next soothing words would be"], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>these he would make reply but was from a certain person whom perhaps we need not name then the whiskey bottle would move forward like a pawn in chess and the next soothing words would be<|im_end|>", 0.8178245425224304, 0.7054712176322937, "deasey would make reply but twas from a certain person whom perhaps we need not name then the whiskey bottle would move forward like a pawn in chess and the next soothing words would be"], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>easy would make reply but was from a certain person whom perhaps we need not name then the whiskey bottle would move forward like a 
pawn in chess and the next suited words would be<|im_end|>", 0.8032783269882202, 0.5896462798118591, "deasey would make reply but twas from a certain person whom perhaps we need not name then the whiskey bottle would move forward like a pawn in chess and the next soothing words would be"], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He did in fact begin it when setting out on the aforementioned second trip to europe, calling it.<|im_end|>", 0.7412750124931335, 0.0, "He did, in fact, begin it when setting out on the aforementioned second trip to europe, calling it."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He did in fact begin it when setting out on the aforementioned second trip to europe, calling it.<|im_end|>", 0.7412750124931335, 0.0, "He did, in fact, begin it when setting out on the aforementioned second trip to europe, calling it."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He did in fact begin it when setting out on the aforementioned second trip to europe, calling it.<|im_end|>", 0.7412750124931335, 0.0, "He did, in fact, begin it when setting out on the aforementioned second trip to europe, calling it."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He did in fact begin it when setting out on the aforementioned second trip to Europe, calling it.<|im_end|>", 0.7412750124931335, 0.0, "He did, in fact, begin it when setting out on the aforementioned second trip to europe, calling it."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Fayard knew that his master was upon him, and he started off upon a rapid pace. And in a few moments, he had ridden on. 
Malagigi pretended to be in great alarm. O noble king and master, he cried, my poor companion has run away with me. He will fall and break his neck.<|im_end|>", 0.40350231528282166, 0.19367654621601105, "Bayard knew that his master was upon him, and he started off upon a rapid pace, and in a few moments was a good way off. Malagigi pretended to be in great alarm o, noble king and master. He cried, my poor companion is run away with he will fall and break his neck."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Veyard knew that his master was upon him, and he started off upon a rapid pace. And in a few moments, he had got well up. Malagigi pretended to be in great alarm. O noble king and master, he cried, my poor companion has run away with me. He will fall and break his neck.<|im_end|>", 0.3942375183105469, -0.0513581745326519, "Bayard knew that his master was upon him, and he started off upon a rapid pace, and in a few moments was a good way off. Malagigi pretended to be in great alarm o, noble king and master. He cried, my poor companion is run away with he will fall and break his neck."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Bayard knew that his master was upon him, and he started off upon a rapid pace. And in a few moments, he had got well up. Malagigi pretended to be in great alarm. O noble king and master, he cried, my poor companion has run away with. He will fall and break his neck.<|im_end|>", 0.4392834007740021, 1.140012264251709, "Bayard knew that his master was upon him, and he started off upon a rapid pace, and in a few moments was a good way off. Malagigi pretended to be in great alarm o, noble king and master. 
He cried, my poor companion is run away with he will fall and break his neck."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Fayard knew that his master was upon him, and he started off upon a rapid pace. And in a few moments, he had gone on maledijiji. Pretended to be in great alarm. O noble king and master, he cried, my poor companion has run away with me. He will fall and break his neck.<|im_end|>", 0.3476942181587219, -1.282332181930542, "Bayard knew that his master was upon him, and he started off upon a rapid pace, and in a few moments was a good way off. Malagigi pretended to be in great alarm o, noble king and master. He cried, my poor companion is run away with he will fall and break his neck."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>She laid a firm, delicate hand on her gold green jerkin. Elidor, this was pleasant, but we got no nearer. We can't sit here and learn the language. Terry protested.<|im_end|>", 0.9210602045059204, -1.0414021015167236, "She laid a firm, delicate hand on her gold green jerkin. Ellador, this was pleasant, but we got no nearer. We can't sit here and learn the language. Terry protested."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>She laid a firm, delicate hand on her gold green jerkin. Ellador. This was pleasant, but we got no nearer. We can't sit here and learn the language. Terry protested.<|im_end|>", 0.9217362999916077, 0.006559576839208603, "She laid a firm, delicate hand on her gold green jerkin. Ellador, this was pleasant, but we got no nearer. We can't sit here and learn the language. 
Terry protested."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>She laid a firm, delicate hand on her gold green jerkin. Ellador. This was pleasant, but we got no nearer. We can't sit here and learn the language. Terry protested.<|im_end|>", 0.9217362999916077, 0.006559576839208603, "She laid a firm, delicate hand on her gold green jerkin. Ellador, this was pleasant, but we got no nearer. We can't sit here and learn the language. Terry protested."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>She laid a firm, delicate hand on her gold green jerkin. Ellador this was pleasant, but we got no nearer. We can't sit here and learn the language. Terry protested.<|im_end|>", 0.9223955273628235, 1.0283753871917725, "She laid a firm, delicate hand on her gold green jerkin. Ellador, this was pleasant, but we got no nearer. We can't sit here and learn the language. 
Terry protested."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>he cried out sadly and fought and struggled two minutes however he did little against his four adversaries and worn out with his struggle clive suddenly went from dusty boy to motionless spirit lost lost he muttered all lost<|im_end|>", -0.10845243185758591, 0.03154230862855911, "he cried out savagely and fought with the strength of two men however he could do little against his four adversaries and worn out with the struggle collapsed suddenly on to the dusty floor with a motion of despair lost lost he muttered all lost"], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>he cried out sadly and fought and strived for two minutes however he did little against his four adversaries and worn out with his struggle, clapped suddenly on the dusty floor with a motionless spirit lost, lost he muttered all lost<|im_end|>", 0.1065172553062439, 1.328436017036438, "he cried out savagely and fought with the strength of two men however he could do little against his four adversaries and worn out with the struggle collapsed suddenly on to the dusty floor with a motion of despair lost lost he muttered all lost"], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>he cried out sadly and fought and struggled two minutes however he did little against four adversaries and worn out with his struggle clive suddenly went from dusty boy with emotion in his spirit lost, lost, he muttered, all lost<|im_end|>", -0.29121696949005127, -1.0710604190826416, "he cried out savagely and fought with the strength of two men however he could do little against his four adversaries and worn out with the struggle collapsed suddenly on to the dusty floor with a motion of despair lost lost he muttered all lost"], ["820", 
"<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>he cried out sadly and fought and struggled to win it however he did little against four adversaries and worn out with his struggle clive suddenly hung from the dusty floor with emotion in his spirit lost, lost he muttered all, lost<|im_end|>", -0.16157105565071106, -0.28891777992248535, "he cried out savagely and fought with the strength of two men however he could do little against his four adversaries and worn out with the struggle collapsed suddenly on to the dusty floor with a motion of despair lost lost he muttered all lost"], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And thus he accomplished this by the bye during the siege of the city, for he had his enemies in great contempt already. Nine when he had thus married mariamne.<|im_end|>", 0.6356512308120728, -1.4962533712387085, "And thus he accomplished this by the by, during the siege of the city. For he had his enemies in great contempt already nine when he had thus married mariamne, he."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And thus he accomplished this by the bye during the siege of the city, for he had his enemies in great contempt already nine when he had thus married mariamne.<|im_end|>", 0.715508222579956, 0.49875012040138245, "And thus he accomplished this by the by, during the siege of the city. 
For he had his enemies in great contempt already nine when he had thus married mariamne, he."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And thus he accomplished this by the bye during the siege of the city, for he had his enemies in great contempt already nine when he had thus married mariamne.<|im_end|>", 0.715508222579956, 0.49875012040138245, "And thus he accomplished this by the by, during the siege of the city. For he had his enemies in great contempt already nine when he had thus married mariamne, he."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And thus he accomplished this by the bye during the siege of the city, for he had his enemies in great contempt already nine when he had thus married mariamne.<|im_end|>", 0.715508222579956, 0.49875012040138245, "And thus he accomplished this by the by, during the siege of the city. For he had his enemies in great contempt already nine when he had thus married mariamne, he."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Putting both hands on her shoulders and looking into the brown eyes, should you be willing to go abroad with your mother and phronsie mister king and jasper? Oh polly gasped. But you.<|im_end|>", 0.7878445386886597, -0.38495707511901855, "Putting both hands on her shoulders and looking into the brown eyes, should you be willing to go abroad with your mother and phronsie, mister king and jasper? Oh, polly gasped, but you."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Putting both hands on her shoulders and looking into the brown eyes, should you be willing to go abroad with your mother and phronsie? Mister king and jasper. 
Oh polly gasped but you.<|im_end|>", 0.7167295217514038, -1.1612764596939087, "Putting both hands on her shoulders and looking into the brown eyes, should you be willing to go abroad with your mother and phronsie, mister king and jasper? Oh, polly gasped, but you."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Putting both hands on her shoulders and looking into the brown eyes, should you be willing to go abroad with your mother and phronsie, mister king and jasper? Oh Polly gasped, but you.<|im_end|>", 0.9294845461845398, 1.1612406969070435, "Putting both hands on her shoulders and looking into the brown eyes, should you be willing to go abroad with your mother and phronsie, mister king and jasper? Oh, polly gasped, but you."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Putting both hands on her shoulders and looking into the brown eyes, should you be willing to go abroad with your mother and phronsie mister king and jasper? Oh, polly gasped. But you.<|im_end|>", 0.858376145362854, 0.3849935233592987, "Putting both hands on her shoulders and looking into the brown eyes, should you be willing to go abroad with your mother and phronsie, mister king and jasper? Oh, polly gasped, but you."]]}
|
wandb/run-20260418_172847-c2a5hfz3/files/media/table/completions_43_9ca1008a424f8bb91c1c.table.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"columns": ["step", "prompt", "completion", "ASRWerSubLenCmpHalluDirtyV56", "advantages", "solution"], "data": [["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Hospitality to persuasion, dissuasion and evasion, a rebel.<|im_end|>", -0.0990181490778923, 0.05529142543673515, "Hospitable to persuasion, dissuasion and evasion. Rebel."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Hospitality to persuasion, dissuasion and evasion a rebel.<|im_end|>", -0.09743088483810425, 0.06276065856218338, "Hospitable to persuasion, dissuasion and evasion. Rebel."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Hospitality to persuasion, dissuasion and evasion, a rebel.<|im_end|>", -0.0990181490778923, 0.05529142543673515, "Hospitable to persuasion, dissuasion and evasion. Rebel."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Hospitality to persuasion, dissuasion and evasion of a rebel.<|im_end|>", -0.6668598651885986, -2.6168177127838135, "Hospitable to persuasion, dissuasion and evasion. Rebel."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Hospitality to persuasion, dissuasion and evasion a rebel.<|im_end|>", -0.09743088483810425, 0.06276065856218338, "Hospitable to persuasion, dissuasion and evasion. Rebel."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Hospitality to persuasion, dissuasion and evasion, a rebel.<|im_end|>", -0.0990181490778923, 0.05529142543673515, "Hospitable to persuasion, dissuasion and evasion. 
Rebel."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Hospitality to persuasion, dissuasion and evasion a rebel.<|im_end|>", -0.09743088483810425, 0.06276065856218338, "Hospitable to persuasion, dissuasion and evasion. Rebel."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Hospitality to persuasion, dissuasion and evasion, a rebel.<|im_end|>", -0.0990181490778923, 0.05529142543673515, "Hospitable to persuasion, dissuasion and evasion. Rebel."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Hospitable to persuasion, dissuasion and evasion, a rebel.<|im_end|>", 0.31988954544067383, 2.026557445526123, "Hospitable to persuasion, dissuasion and evasion. Rebel."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Hospitality to persuasion, dissuasion and evasion a rebel.<|im_end|>", -0.09743088483810425, 0.06276065856218338, "Hospitable to persuasion, dissuasion and evasion. Rebel."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Hospitality to persuasion, dissuasion and evasion, a rebel.<|im_end|>", -0.0990181490778923, 0.05529142543673515, "Hospitable to persuasion, dissuasion and evasion. Rebel."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Hospitality to persuasion, dissuasion and evasion a rebel.<|im_end|>", -0.09743088483810425, 0.06276065856218338, "Hospitable to persuasion, dissuasion and evasion. Rebel."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>But my sister must know you, she must until she need. 
Added richard pentecost.<|im_end|>", -0.9152219295501709, -1.1293256282806396, "Ah, but my sister must know you. She must, in case of need, have you to depend upon."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Ah, but my sister must know you she must until she need had reached a point of health.<|im_end|>", -0.8091338276863098, 0.08761630952358246, "Ah, but my sister must know you. She must, in case of need, have you to depend upon."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Ah, but my sister must know you she must until she need had reached a point of calm.<|im_end|>", -0.805532693862915, 0.12892509996891022, "Ah, but my sister must know you. She must, in case of need, have you to depend upon."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>But my sister must know you, she must until she need had reached a point of time.<|im_end|>", -0.9473012685775757, -1.4973094463348389, "Ah, but my sister must know you. She must, in case of need, have you to depend upon."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Ah, but my sister must know you, she must until he's met college de pontiac.<|im_end|>", -0.7323250770568848, 0.9686933755874634, "Ah, but my sister must know you. She must, in case of need, have you to depend upon."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Ah, but my sister must know you she must until he's met had reached a point of it.<|im_end|>", -0.8147860765457153, 0.022779079154133797, "Ah, but my sister must know you. 
She must, in case of need, have you to depend upon."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Ah, but my sister must know you she must until her death. I urged a point of time.<|im_end|>", -0.8164224624633789, 0.0040080128237605095, "Ah, but my sister must know you. She must, in case of need, have you to depend upon."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Ah, but my sister must know you she must until she need had reached a point of time.<|im_end|>", -0.8074418306350708, 0.10702529549598694, "Ah, but my sister must know you. She must, in case of need, have you to depend upon."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Ah, but my sister must know you she must until she need had reached a point of calm.<|im_end|>", -0.805532693862915, 0.12892509996891022, "Ah, but my sister must know you. She must, in case of need, have you to depend upon."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Ah, but my sister must know you. She must until she need have reached a point of that.<|im_end|>", -0.6205787658691406, 2.2505409717559814, "Ah, but my sister must know you. She must, in case of need, have you to depend upon."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>But my sister must know you, she must until tonight. Added, reached a pinnacle.<|im_end|>", -0.919543445110321, -1.1788979768753052, "Ah, but my sister must know you. 
She must, in case of need, have you to depend upon."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Ah, but my sister must know you she must until she need had reached a point of that.<|im_end|>", -0.8074418306350708, 0.10702529549598694, "Ah, but my sister must know you. She must, in case of need, have you to depend upon."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>My fellow, come along. He caught my arm and following our guide we hurried on through the darkness which was so dense that it did not bide to the wonderful eyesight of my black companion. A faculty which seemed to have been acquired.<|im_end|>", 0.5165535807609558, 1.6058197021484375, "black fellow come along he caught my arm and following our guide we hurried on through the darkness which was so dense that if it had not been for the wonderful eyesight of my black companion a faculty which seemed to have been acquired"], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>My fellow, come along. He caught my arm and following our guide we hurried on through the darkness which was so dense that it did not bid for the wonderful eyesight of my black companion. On the faculty which seemed to admit acquired.<|im_end|>", 0.34349849820137024, 0.2518061101436615, "black fellow come along he caught my arm and following our guide we hurried on through the darkness which was so dense that if it had not been for the wonderful eyesight of my black companion a faculty which seemed to have been acquired"], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>My fellow, come along. 
He cut my arm and following our guide we hurried on through the darkness which was so dense that it did not bid for the wonderful eyesight of my black companion. On the faculty which seemed to admit of acquired.<|im_end|>", 0.2730351984500885, -0.299511194229126, "black fellow come along he caught my arm and following our guide we hurried on through the darkness which was so dense that if it had not been for the wonderful eyesight of my black companion a faculty which seemed to have been acquired"], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>My fellow, come along. He caught my arm and following our guide we hurried on through the darkness which was so dense that it did not bide for the wonderful eyesight of my black companion. The faculty with speed to admit acquired.<|im_end|>", 0.2683812379837036, -0.33592459559440613, "black fellow come along he caught my arm and following our guide we hurried on through the darkness which was so dense that if it had not been for the wonderful eyesight of my black companion a faculty which seemed to have been acquired"], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>My fellow, come along. He caught my arm and following our guide we hurried on through the darkness which was so dense that it did not bide for the wonderful eyesight of my black companion. On the faculty with speed to admit the acquired.<|im_end|>", 0.20993445813655853, -0.7932225465774536, "black fellow come along he caught my arm and following our guide we hurried on through the darkness which was so dense that if it had not been for the wonderful eyesight of my black companion a faculty which seemed to have been acquired"], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>My fellow, come along. 
He caught my arm and following our guide we hurried on through the darkness which was so dense that it did not bid for the wonderful eyesight of my black companion. A faculty which seemed to have been acquired.<|im_end|>", 0.5796752572059631, 2.0996947288513184, "black fellow come along he caught my arm and following our guide we hurried on through the darkness which was so dense that if it had not been for the wonderful eyesight of my black companion a faculty which seemed to have been acquired"], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>My fellow, come along. He caught my arm and following our guide we hurried on through the darkness which was so dense that it did not bid for the wonderful eyesight of my black companion. On the faculty which seemed to admit of acquired.<|im_end|>", 0.3366594910621643, 0.19829651713371277, "black fellow come along he caught my arm and following our guide we hurried on through the darkness which was so dense that if it had not been for the wonderful eyesight of my black companion a faculty which seemed to have been acquired"], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>My fellow, come along. He caught my arm and following our guide we hurried on through the darkness which was so dense that it did not bid for the wonderful eyesight of my black companion. On the faculty which seemed to admit of acquired.<|im_end|>", 0.3366594910621643, 0.19829651713371277, "black fellow come along he caught my arm and following our guide we hurried on through the darkness which was so dense that if it had not been for the wonderful eyesight of my black companion a faculty which seemed to have been acquired"], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>My fellow, come along. 
He caught my arm and following our guide we hurried on through the darkness which was so dense that it did not bid for the wonderful eyesight of my black companion. I was faculty with speed to a myth of acquired.<|im_end|>", 0.15785956382751465, -1.2006657123565674, "black fellow come along he caught my arm and following our guide we hurried on through the darkness which was so dense that if it had not been for the wonderful eyesight of my black companion a faculty which seemed to have been acquired"], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>My fellow, come along. He cut my arm and following our guide we hurried on through the darkness which was so dense that it did not bid for the wonderful eyesight of my black companion. On the faculty which seemed to admit of acquired.<|im_end|>", 0.2730351984500885, -0.299511194229126, "black fellow come along he caught my arm and following our guide we hurried on through the darkness which was so dense that if it had not been for the wonderful eyesight of my black companion a faculty which seemed to have been acquired"], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>My fellow, come along. He caught my arm and following our guide we hurried on through the darkness which was so dense that it did not bid for the wonderful eyesight of my black companion. By the faculty which seemed to admit it, I inquired.<|im_end|>", 0.2825254499912262, -0.22525779902935028, "black fellow come along he caught my arm and following our guide we hurried on through the darkness which was so dense that if it had not been for the wonderful eyesight of my black companion a faculty which seemed to have been acquired"], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>My fellow, come along. 
He cut my arm and following our guide we hurried on through the darkness which was so dense that it did not bide for the wonderful eyesight of my black companion. On the faculty which speeded him inquired.<|im_end|>", 0.15796764194965363, -1.1998201608657837, "black fellow come along he caught my arm and following our guide we hurried on through the darkness which was so dense that if it had not been for the wonderful eyesight of my black companion a faculty which seemed to have been acquired"], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Scrapper's slightly raised cap seemed all black, but Peter turned up close enough and what he found couldn't eat was a patch of brown fur. While Peter sat staring up at him, Scrapper suddenly darted out into the air.<|im_end|>", 0.11510307341814041, 2.3401176929473877, "Scrapper's slightly raised cap seemed all black. But if peter could have gotten close enough, he would have found that hidden in it was a patch of orange red. While peter sat staring up at him, scrapper suddenly darted out into the air."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Scrapper's slightly raised cap seemed all black and quite quite ugly, so that he really found it good indeed was a patch of pure white while peter sat staring up at him scrapper suddenly darted out into the air.<|im_end|>", -0.09485074132680893, -1.0294468402862549, "Scrapper's slightly raised cap seemed all black. But if peter could have gotten close enough, he would have found that hidden in it was a patch of orange red. 
While peter sat staring up at him, scrapper suddenly darted out into the air."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Scrapper's slightly raised cap seemed, while black but dark and ugly close enough in a way that he couldn't eat was a patch of clear thread. While Peter sat staring up at him, Scrapper suddenly darted out into the air.<|im_end|>", -0.10472522675991058, -1.1879230737686157, "Scrapper's slightly raised cap seemed all black. But if peter could have gotten close enough, he would have found that hidden in it was a patch of orange red. While peter sat staring up at him, scrapper suddenly darted out into the air."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Scrapper's slightly raised cap seemed all black, but in a corner close enough to where he had found good meat was a patch of brown fur. While Peter sat staring up at him, Scrapper suddenly darted out into the air.<|im_end|>", 0.03434121981263161, 1.0439646244049072, "Scrapper's slightly raised cap seemed all black. But if peter could have gotten close enough, he would have found that hidden in it was a patch of orange red. While peter sat staring up at him, scrapper suddenly darted out into the air."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Scrapper's slightly raised cap seemed by black, but Peter couldn't get close enough and what he found couldn't eat was a patch of iron thread while peter sat staring up at him scrapper suddenly darted out into the air.<|im_end|>", -0.019613485783338547, 0.17804156243801117, "Scrapper's slightly raised cap seemed all black. But if peter could have gotten close enough, he would have found that hidden in it was a patch of orange red. 
While peter sat staring up at him, scrapper suddenly darted out into the air."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Scrapper's slightly raised cap seemed mob black like a peanut gum kerosene, and what he found couldn't eat was a patch of burned hair. While Peter sat staring up at him, Scrapper suddenly darted out into the air.<|im_end|>", -0.09868084639310837, -1.0909165143966675, "Scrapper's slightly raised cap seemed all black. But if peter could have gotten close enough, he would have found that hidden in it was a patch of orange red. While peter sat staring up at him, scrapper suddenly darted out into the air."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Scrapper's slightly raised cap seemed rather black, but Peter put it down cautiously and what he found couldn't eat was a patch of brown fur. While Peter sat staring up at him, Scrapper suddenly darted out into the air.<|im_end|>", -0.027708640322089195, 0.048121821135282516, "Scrapper's slightly raised cap seemed all black. But if peter could have gotten close enough, he would have found that hidden in it was a patch of orange red. While peter sat staring up at him, scrapper suddenly darted out into the air."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Scrapper's slightly raised cap seemed rather black, but Peter couldn't go closer than he really found it good and neat was a patch of fine fur while Peter sat staring up at him scrapper suddenly darted out into the air.<|im_end|>", -0.034929804503917694, -0.06777118146419525, "Scrapper's slightly raised cap seemed all black. But if peter could have gotten close enough, he would have found that hidden in it was a patch of orange red. 
While peter sat staring up at him, scrapper suddenly darted out into the air."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Scrapper's slightly raised cap seemed rather black, but peter put it down close enough that he really found it good and neat as a patch of pure thread. While peter sat staring up at him, scrapper suddenly darted out into the air.<|im_end|>", -0.0638682171702385, -0.5322059392929077, "Scrapper's slightly raised cap seemed all black. But if peter could have gotten close enough, he would have found that hidden in it was a patch of orange red. While peter sat staring up at him, scrapper suddenly darted out into the air."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Scrapper's slightly raised cap seemed rather black, but Peter couldn't get close enough to look down and could n't eat was a patch of pure white. While Peter sat staring up at him, Scrapper suddenly darted out into the air.<|im_end|>", -0.03125457838177681, -0.008787202648818493, "Scrapper's slightly raised cap seemed all black. But if peter could have gotten close enough, he would have found that hidden in it was a patch of orange red. While peter sat staring up at him, scrapper suddenly darted out into the air."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Scrapper's slightly raised cap seemed all black, but through it came a glimpse of that he had really found good and eat was a patch of brown fur. While Peter sat staring up at him, Scrapper suddenly darted out into the air.<|im_end|>", 0.005603947211056948, 0.5827580094337463, "Scrapper's slightly raised cap seemed all black. But if peter could have gotten close enough, he would have found that hidden in it was a patch of orange red. 
While peter sat staring up at him, scrapper suddenly darted out into the air."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Scrapper's slightly raised cap seemed odd black, but Peter couldn't have told you that he really found it good and neat as a patch of fine thread while Peter sat staring up at him Scrapper suddenly darted out into the air.<|im_end|>", -0.04790138080716133, -0.2759529650211334, "Scrapper's slightly raised cap seemed all black. But if peter could have gotten close enough, he would have found that hidden in it was a patch of orange red. While peter sat staring up at him, scrapper suddenly darted out into the air."]]}
|
wandb/run-20260418_172847-c2a5hfz3/files/media/table/completions_63_9c15897616f0ff0b68b9.table.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"columns": ["step", "prompt", "completion", "ASRWerSubLenCmpHalluDirtyV56", "advantages", "solution"], "data": [["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Or go on forever without swerving to the right or to the left that is what it means to escape this paralysis you should ask how does a straight line feel it feels as I suppose it must straight<|im_end|>", 0.8176915645599365, -0.15929217636585236, "or go on forever without swerving to the right or to the left that is what it means to escape this moralizing you should ask how does the straight line feel it feels as i suppose it looks straight"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Or go on forever without swerving to the right or to the left that is what it means to escape this paralysis you should ask how does a straight line feel it feels as I suppose it must straight<|im_end|>", 0.8176915645599365, -0.15929217636585236, "or go on forever without swerving to the right or to the left that is what it means to escape this moralizing you should ask how does the straight line feel it feels as i suppose it looks straight"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Or go on forever without swerving to the right or to the left that is what it means to escape this paralysis you should ask how does the straight line feel it feels as I suppose it must straight<|im_end|>", 0.8759769797325134, 0.7718859910964966, "or go on forever without swerving to the right or to the left that is what it means to escape this moralizing you should ask how does the straight line feel it feels as i suppose it looks straight"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Or go on forever without swerving to the right 
or to the left that is what it means to escape this paralysis you should ask how does the straight line feel it feels as I suppose it must straight<|im_end|>", 0.8759769797325134, 0.7718859910964966, "or go on forever without swerving to the right or to the left that is what it means to escape this moralizing you should ask how does the straight line feel it feels as i suppose it looks straight"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Or go on forever without swerving to the right or to the left that is what it means to escape this paralysis you should ask how does the straight line feel it feels as I suppose it must straight<|im_end|>", 0.8759769797325134, 0.7718859910964966, "or go on forever without swerving to the right or to the left that is what it means to escape this moralizing you should ask how does the straight line feel it feels as i suppose it looks straight"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Or go on forever without stopping to the right or to the left that is what it means to escape this paralysis you should ask how does the straight line feel it feels as I suppose it must straight<|im_end|>", 0.8153555989265442, -0.19661197066307068, "or go on forever without swerving to the right or to the left that is what it means to escape this moralizing you should ask how does the straight line feel it feels as i suppose it looks straight"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Or go on forever without stopping to the right or to the left that is what it means to escape this paralysis you should ask how does the straight line feel it feels as I suppose it must straight<|im_end|>", 0.8153555989265442, -0.19661197066307068, "or go on forever without swerving to the right or to the left that is what it 
means to escape this moralizing you should ask how does the straight line feel it feels as i suppose it looks straight"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Or go on forever without stopping to the right or to the left that is what it means to escape the spiral axis you should ask how does a straight line feel it feels as I suppose it must straight<|im_end|>", 0.6529189348220825, -2.791729211807251, "or go on forever without swerving to the right or to the left that is what it means to escape this moralizing you should ask how does the straight line feel it feels as i suppose it looks straight"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Or go on forever without swerving to the right or to the left that is what it means to escape this paralysis you should ask how does the straight line feel it feels as I suppose it must straight<|im_end|>", 0.8759769797325134, 0.7718859910964966, "or go on forever without swerving to the right or to the left that is what it means to escape this moralizing you should ask how does the straight line feel it feels as i suppose it looks straight"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Or go on forever without swerving to the right or to the left that is what it means to escape this paralysis you should ask how does the straight line feel it feels as I suppose it must straight<|im_end|>", 0.8759769797325134, 0.7718859910964966, "or go on forever without swerving to the right or to the left that is what it means to escape this moralizing you should ask how does the straight line feel it feels as i suppose it looks straight"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Or go on forever without swerving to 
the right or to the left that is what it means to escape this paralysis you should ask how does a straight line feel it feels as I suppose it must straight<|im_end|>", 0.8176915645599365, -0.15929217636585236, "or go on forever without swerving to the right or to the left that is what it means to escape this moralizing you should ask how does the straight line feel it feels as i suppose it looks straight"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Or go on forever without stopping to the right or to the left that is what it means to escape this paralysis you should ask how does the straight line feel it feels as I suppose it must straight<|im_end|>", 0.8153555989265442, -0.19661197066307068, "or go on forever without swerving to the right or to the left that is what it means to escape this moralizing you should ask how does the straight line feel it feels as i suppose it looks straight"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They twist his foot and beat him again, in another place. He that flattereth his neighbour spreadeth a net for mischief. So I will try to keep away from that lady, shall I not papa? Whenever you can do so without ruin this daughter.<|im_end|>", 0.04660210758447647, -0.13953234255313873, "Favor is deceitful, and beauty is vain. And in another place, he that flattereth his neighbor spreadeth a net for his feet. So I will try to keep away from that lady, shall I not? Papa, whenever you can do so without rudeness. Daughter."], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They twist his neck and make him sing in another place, he that flattereth his neighbour spreadeth a net for his feet. So I will try to keep away from that lady, shall I not papa? 
Whenever you can do so without rudeness, daughter.<|im_end|>", 0.2873304486274719, 1.2487980127334595, "Favor is deceitful, and beauty is vain. And in another place, he that flattereth his neighbor spreadeth a net for his feet. So I will try to keep away from that lady, shall I not? Papa, whenever you can do so without rudeness. Daughter."], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They twist and twist, and do as they will, in another place. He that flattereth his neighbour spreadeth a net for his gain. So I will try to keep away from that lady. Shall I not papa? Whenever you can do so without ruin, my daughter.<|im_end|>", 0.04480805993080139, -0.14987899363040924, "Favor is deceitful, and beauty is vain. And in another place, he that flattereth his neighbor spreadeth a net for his feet. So I will try to keep away from that lady, shall I not? Papa, whenever you can do so without rudeness. Daughter."], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They twist and fold, and bend and sin in some other place he that flattereth his neighbour spreadeth a net for him so I will try to keep away from that lately shall I not papa whenever you can do so without rudeness daughter<|im_end|>", -0.06204881891608238, -0.7661447525024414, "Favor is deceitful, and beauty is vain. And in another place, he that flattereth his neighbor spreadeth a net for his feet. So I will try to keep away from that lady, shall I not? Papa, whenever you can do so without rudeness. Daughter."], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>save rooster's nest and bird's ass in another place, he that flattereth his neighbour spreadeth a net for himself. So I will try to keep away from that lady, shall I not papa? 
Whenever you can do so without rudeness, daughter.<|im_end|>", 0.25164204835891724, 1.0429755449295044, "Favor is deceitful, and beauty is vain. And in another place, he that flattereth his neighbor spreadeth a net for his feet. So I will try to keep away from that lady, shall I not? Papa, whenever you can do so without rudeness. Daughter."], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They will see you there, and be as angry in another place. He that flattereth his neighbour spreadeth him nighfully. So I will try to keep away from that lady, shall I not papa? Whenever you can do so without rudeness, daughter.<|im_end|>", -0.12804561853408813, -1.1467620134353638, "Favor is deceitful, and beauty is vain. And in another place, he that flattereth his neighbor spreadeth a net for his feet. So I will try to keep away from that lady, shall I not? Papa, whenever you can do so without rudeness. Daughter."], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>save his sister's life and do as i say in another place, he that flattereth his neighbour spreadeth a net for him so I will try to keep away from that lady shall I not papa? Whenever you can do so without ruining this daughter.<|im_end|>", 0.05892462283372879, -0.06846584379673004, "Favor is deceitful, and beauty is vain. And in another place, he that flattereth his neighbor spreadeth a net for his feet. So I will try to keep away from that lady, shall I not? Papa, whenever you can do so without rudeness. Daughter."], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They twist and wriggle, and do as they can. And in another place he that flattereth his neighbour spreadeth a net for him. So I will try to keep away from that lady, shall I not papa? 
Whenever you can do so without rudeness, daughter.<|im_end|>", 0.12734483182430267, 0.32612770795822144, "Favor is deceitful, and beauty is vain. And in another place, he that flattereth his neighbor spreadeth a net for his feet. So I will try to keep away from that lady, shall I not? Papa, whenever you can do so without rudeness. Daughter."], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They twist and twirl, and turn and spin. And in another place, he that flattereth his neighbour spreadeth a net for his gain. So I will try to keep away from that way. Shall I not papa? Whenever you can do so without rudeness, daughter.<|im_end|>", 0.2292451709508896, 0.9138080477714539, "Favor is deceitful, and beauty is vain. And in another place, he that flattereth his neighbor spreadeth a net for his feet. So I will try to keep away from that lady, shall I not? Papa, whenever you can do so without rudeness. Daughter."], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They please to see me and do as I say in another place he that flattereth his neighbour spreadeth him nectarously so I will try to keep away from that lady shall I not papa whenever you can do so without ruining us daughter<|im_end|>", -0.3151572346687317, -2.2258734703063965, "Favor is deceitful, and beauty is vain. And in another place, he that flattereth his neighbor spreadeth a net for his feet. So I will try to keep away from that lady, shall I not? Papa, whenever you can do so without rudeness. Daughter."], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>save his sister and do as he does in another place, he that flattereth his neighbour spreadeth a net for himself. So I will try to keep away from that lady, shall I not papa? 
Whenever you can do so without robbing his daughter.<|im_end|>", 0.1756473332643509, 0.6046982407569885, "Favor is deceitful, and beauty is vain. And in another place, he that flattereth his neighbor spreadeth a net for his feet. So I will try to keep away from that lady, shall I not? Papa, whenever you can do so without rudeness. Daughter."], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They will, said he and do as they please. And in another place, he that flattereth his neighbour spreadeth a net for him. So I will try to keep away from that lady, shall I not papa? Whenever you can do so without robbing this daughter.<|im_end|>", 0.13326135277748108, 0.36024948954582214, "Favor is deceitful, and beauty is vain. And in another place, he that flattereth his neighbor spreadeth a net for his feet. So I will try to keep away from that lady, shall I not? Papa, whenever you can do so without rudeness. Daughter."], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I was so anxious to hear a little about him to know what I could keep away that's another thing and shows me that if I didn't teach my boys anything else I did give them brotherly love that when they say how good we were in our services to all who came<|im_end|>", -0.27307480573654175, -0.7399817705154419, "i was so anxious to hear all about the dear old boy i couldn't keep away that's right comfortable and shows me that if i didn't teach my boys anything else i did give them the brotherly love that will make them stand by one another all their lives said missus jo when he had gone"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I was so anxious to hear a little about you to know what I could keep away that's enough and shows me that if I didn't teach my boys anything else, I did 
give them brotherly love, but with a samurai or battle of war civilities too formal<|im_end|>", -0.43343213200569153, -2.054769992828369, "i was so anxious to hear all about the dear old boy i couldn't keep away that's right comfortable and shows me that if i didn't teach my boys anything else i did give them the brotherly love that will make them stand by one another all their lives said missus jo when he had gone"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I was so anxious to hear about her, to know what I could keep away that's enough of it and shows me that if I didn't teach my boys anything else I did give them brotherly love that made their sad and lonely hours seem a little more palatable<|im_end|>", -0.2620263695716858, -0.6493943333625793, "i was so anxious to hear all about the dear old boy i couldn't keep away that's right comfortable and shows me that if i didn't teach my boys anything else i did give them the brotherly love that will make them stand by one another all their lives said missus jo when he had gone"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I was so anxious to hear a little about him, to know what I could keep away that's another thing and shows me that if I didn't teach my boys anything else I did give them brotherly love that when they say nothing of their own or some one is stupid or weak.<|im_end|>", -0.21280650794506073, -0.24583503603935242, "i was so anxious to hear all about the dear old boy i couldn't keep away that's right comfortable and shows me that if i didn't teach my boys anything else i did give them the brotherly love that will make them stand by one another all their lives said missus jo when he had gone"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I was so anxious to hear 
about you, dear boy, I couldn't keep away. That's another thing and shows me that if I didn't teach my boys anything else, I did give them a brotherly love that made their sad hour of trouble worse than the sickness itself.<|im_end|>", -0.23551680147647858, -0.432039350271225, "i was so anxious to hear all about the dear old boy i couldn't keep away that's right comfortable and shows me that if i didn't teach my boys anything else i did give them the brotherly love that will make them stand by one another all their lives said missus jo when he had gone"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I was so anxious to hear a little about him to know what I could keep away that's enough of it and shows me that if I didn't teach my boys anything else I did give them brotherly love that will render Sam happy or make their mothers' sinlessness superfluous<|im_end|>", -0.18895041942596436, -0.05023622140288353, "i was so anxious to hear all about the dear old boy i couldn't keep away that's right comfortable and shows me that if i didn't teach my boys anything else i did give them the brotherly love that will make them stand by one another all their lives said missus jo when he had gone"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I was so anxious to hear a little about her to a boy I couldn't keep away that's enough and shows me that if I didn't teach my boys anything else I did give them brotherly love that will in a sad hour bring back their own personal sympathies to my heart<|im_end|>", -0.0468180887401104, 1.1151231527328491, "i was so anxious to hear all about the dear old boy i couldn't keep away that's right comfortable and shows me that if i didn't teach my boys anything else i did give them the brotherly love that will make them stand by one another all their lives said missus jo when he had gone"], 
["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I was so anxious to hear a mother talk to her boy I couldn't keep away that's another proof it shows me that if I didn't teach my boys anything else I did give them brotherly love that will in a sad hour comfort and divert their sicknesses to the morning<|im_end|>", -0.1063055768609047, 0.6273783445358276, "i was so anxious to hear all about the dear old boy i couldn't keep away that's right comfortable and shows me that if i didn't teach my boys anything else i did give them the brotherly love that will make them stand by one another all their lives said missus jo when he had gone"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I was so anxious to hear all about you, dear old boy, I couldn't keep away that's another proof and shows me that if I didn't teach my boys anything else, I did give them brotherly love that led to the same kind of good and bad comparisons as this stupid boy.<|im_end|>", -0.060284294188022614, 1.0047121047973633, "i was so anxious to hear all about the dear old boy i couldn't keep away that's right comfortable and shows me that if i didn't teach my boys anything else i did give them the brotherly love that will make them stand by one another all their lives said missus jo when he had gone"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I was so anxious to hear all about you to a boy I couldn't keep away that's another proof and shows me that if I didn't teach my boys anything else I did give them brotherly love that when they say I'm a good boy I mean I've been a son of sin since school days<|im_end|>", -0.13280440866947174, 0.4101113975048065, "i was so anxious to hear all about the dear old boy i couldn't keep away that's right comfortable and shows me that if i 
didn't teach my boys anything else i did give them the brotherly love that will make them stand by one another all their lives said missus jo when he had gone"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I was so anxious to hear a lullaby to a boy I could keep away that's enough of him and shows me that if I didn't teach my boys anything else I did give them brotherly love that made their sad hour more bearable than our sinlessness to you all<|im_end|>", -0.2491731345653534, -0.5440092086791992, "i was so anxious to hear all about the dear old boy i couldn't keep away that's right comfortable and shows me that if i didn't teach my boys anything else i did give them the brotherly love that will make them stand by one another all their lives said missus jo when he had gone"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I was so anxious to hear all about it to a boy I couldn't keep away that's enough of him and shows me that if I didn't teach my boys anything else I did give them brotherly love that will in the same way overcome their own worst tendencies too far<|im_end|>", 0.00731202308088541, 1.558942198753357, "i was so anxious to hear all about the dear old boy i couldn't keep away that's right comfortable and shows me that if i didn't teach my boys anything else i did give them the brotherly love that will make them stand by one another all their lives said missus jo when he had gone"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Increased materially and therefore also with powers of resistance may easily be conceived with vast quantities of elastic gases what mass of molten matter accumulated beneath its solid surface lost no exit as practicable after the cooling of the trachy crust<|im_end|>", 0.6219021677970886, 
0.48375576734542847, "increased materially and therefore also its powers of resistance it may easily be conceived what vast quantities of elastic gases what masses of molten matter accumulated beneath its solid surface whilst no exit was practicable after the cooling of the trachytic crust"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Increased materially and therefore also in the powers of resistance may easily be conceived with vast quantities of elastic gases what mass of molten matter accumulated beneath its solid surface whilst no exit is practicable after the cooling of the tribut crust<|im_end|>", 0.6310301423072815, 0.5756562948226929, "increased materially and therefore also its powers of resistance it may easily be conceived what vast quantities of elastic gases what masses of molten matter accumulated beneath its solid surface whilst no exit was practicable after the cooling of the trachytic crust"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Increased materially and therefore also in the power of resistance may easily be conceived with vast quantities of elastic gases what mass of molten matter accumulated beneath its solid surface whilst no exit is practicable after the cooling of the trading crust<|im_end|>", 0.5663049817085266, -0.07599729299545288, "increased materially and therefore also its powers of resistance it may easily be conceived what vast quantities of elastic gases what masses of molten matter accumulated beneath its solid surface whilst no exit was practicable after the cooling of the trachytic crust"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Increased materially and therefore also in powers of resistance, it may easily be conceived that vast quantities of elastic gases, what mass of molten 
matter accumulated beneath its solid surface, whilst no exit is practicable after the cooling of the trivet crust.<|im_end|>", 0.4862109422683716, -0.8823849558830261, "increased materially and therefore also its powers of resistance it may easily be conceived what vast quantities of elastic gases what masses of molten matter accumulated beneath its solid surface whilst no exit was practicable after the cooling of the trachytic crust"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Increase materially and therefore also the power of resistance it may easily be conceived with vast quantities of elastic gases what mass of molten matter accumulated beneath its solid surface whilst no exit is practicable after the cooling of the trivet crust<|im_end|>", 0.6143525242805481, 0.407745897769928, "increased materially and therefore also its powers of resistance it may easily be conceived what vast quantities of elastic gases what masses of molten matter accumulated beneath its solid surface whilst no exit was practicable after the cooling of the trachytic crust"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Increased materially, and therefore also with powers of resistance may easily be conceived a vast quantities of elastic gases what mass of molten matter accumulated beneath its solid surface whilst no exit is practicable after the cooling of the trigate crust<|im_end|>", 0.6209789514541626, 0.47446081042289734, "increased materially and therefore also its powers of resistance it may easily be conceived what vast quantities of elastic gases what masses of molten matter accumulated beneath its solid surface whilst no exit was practicable after the cooling of the trachytic crust"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Increase 
materially and therefore also in the power of resistance may easily be conceived with vast quantities of elastic gases what mass of impalpable matter accumulated beneath its solid surface whilst no exit is practicable after the cooling of the trading crust<|im_end|>", 0.43219640851020813, -1.4262038469314575, "increased materially and therefore also its powers of resistance it may easily be conceived what vast quantities of elastic gases what masses of molten matter accumulated beneath its solid surface whilst no exit was practicable after the cooling of the trachytic crust"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Increased materially and therefore also in powers of resistance may easily be conceived with vast quantities of elastic gases what mass of molten matter accumulated beneath its solid surface whilst no exit is practicable after the cooling of the tributary crust<|im_end|>", 0.6819920539855957, 1.088741421699524, "increased materially and therefore also its powers of resistance it may easily be conceived what vast quantities of elastic gases what masses of molten matter accumulated beneath its solid surface whilst no exit was practicable after the cooling of the trachytic crust"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Increased materially, and therefore also with powers of resistance may easily be conceived. With vast quantities of elastic gases, what mass of molten matter accumulated beneath its solid surface? 
Whilst no exit is practicable after the cooling of the trinity crust.<|im_end|>", 0.3609590530395508, -2.1434223651885986, "increased materially and therefore also its powers of resistance it may easily be conceived what vast quantities of elastic gases what masses of molten matter accumulated beneath its solid surface whilst no exit was practicable after the cooling of the trachytic crust"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Increase materially and therefore also in powers of resistance may easily be conceived with vast quantities of elastic gases what mass of molten matter accumulated beneath its solid surface whilst no exit is practicable after the cooling of the trading crust<|im_end|>", 0.6215246319770813, 0.4799547493457794, "increased materially and therefore also its powers of resistance it may easily be conceived what vast quantities of elastic gases what masses of molten matter accumulated beneath its solid surface whilst no exit was practicable after the cooling of the trachytic crust"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Increased materially and therefore also with powers of resistance may easily be conceived a vast quantities of elastic gases what mass of molten matter accumulated beneath its solid surface whilst no exit is practicable after the cooling of the tribut crust<|im_end|>", 0.6820893883705139, 1.0897213220596313, "increased materially and therefore also its powers of resistance it may easily be conceived what vast quantities of elastic gases what masses of molten matter accumulated beneath its solid surface whilst no exit was practicable after the cooling of the trachytic crust"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Increase materially and therefore also the powers of resistance 
may easily be conceived with vast quantities of elastic gases what mass of molten matter accumulated beneath its solid surface whilst no exit is practicable after the cooling of the trade at crust<|im_end|>", 0.5666987299919128, -0.07203302532434464, "increased materially and therefore also its powers of resistance it may easily be conceived what vast quantities of elastic gases what masses of molten matter accumulated beneath its solid surface whilst no exit was practicable after the cooling of the trachytic crust"]]}
|
wandb/run-20260418_172847-c2a5hfz3/files/output.log
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
wandb/run-20260418_172847-c2a5hfz3/files/requirements.txt
ADDED
|
@@ -0,0 +1,255 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
psutil==7.2.2
|
| 2 |
+
colorama==0.4.6
|
| 3 |
+
typing-inspection==0.4.2
|
| 4 |
+
dill==0.3.8
|
| 5 |
+
aliyun-python-sdk-kms==2.16.5
|
| 6 |
+
urllib3==2.6.3
|
| 7 |
+
torch==2.6.0
|
| 8 |
+
threadpoolctl==3.6.0
|
| 9 |
+
pyzmq==27.1.0
|
| 10 |
+
astor==0.8.1
|
| 11 |
+
hf-xet==1.4.3
|
| 12 |
+
sniffio==1.3.1
|
| 13 |
+
tensorboard==2.20.0
|
| 14 |
+
fastar==0.11.0
|
| 15 |
+
llvmlite==0.43.0
|
| 16 |
+
pathspec==1.0.4
|
| 17 |
+
mkl_fft==1.3.11
|
| 18 |
+
prometheus_client==0.25.0
|
| 19 |
+
async-timeout==5.0.1
|
| 20 |
+
scikit-learn==1.7.2
|
| 21 |
+
sortedcontainers==2.4.0
|
| 22 |
+
Bottleneck==1.4.2
|
| 23 |
+
orjson==3.11.8
|
| 24 |
+
nest-asyncio==1.6.0
|
| 25 |
+
cupy-cuda12x==13.6.0
|
| 26 |
+
semantic-version==2.10.0
|
| 27 |
+
aiosignal==1.4.0
|
| 28 |
+
fsspec==2025.3.0
|
| 29 |
+
dyNET38==2.2
|
| 30 |
+
shellingham==1.5.4
|
| 31 |
+
zstandard==0.25.0
|
| 32 |
+
PyYAML==6.0.3
|
| 33 |
+
nvidia-curand-cu12==10.3.5.147
|
| 34 |
+
gradio==5.50.0
|
| 35 |
+
Werkzeug==3.1.8
|
| 36 |
+
grpcio==1.80.0
|
| 37 |
+
aiohttp==3.13.5
|
| 38 |
+
Flask==3.1.3
|
| 39 |
+
python-json-logger==4.1.0
|
| 40 |
+
trl==0.29.1
|
| 41 |
+
nltk==3.9.4
|
| 42 |
+
platformdirs==4.9.6
|
| 43 |
+
lm-format-enforcer==0.10.12
|
| 44 |
+
pyparsing==3.3.2
|
| 45 |
+
jmespath==0.10.0
|
| 46 |
+
starlette==0.52.1
|
| 47 |
+
crcmod==1.7
|
| 48 |
+
dnspython==2.8.0
|
| 49 |
+
antlr4-python3-runtime==4.9.3
|
| 50 |
+
rouge==1.0.1
|
| 51 |
+
importlib_metadata==9.0.0
|
| 52 |
+
nvidia-cudnn-cu12==9.1.0.70
|
| 53 |
+
safetensors==0.7.0
|
| 54 |
+
blake3==1.0.8
|
| 55 |
+
interegular==0.3.3
|
| 56 |
+
tiktoken==0.11.0
|
| 57 |
+
pydantic_core==2.41.4
|
| 58 |
+
outlines==0.1.11
|
| 59 |
+
airportsdata==20260315
|
| 60 |
+
rich-toolkit==0.19.7
|
| 61 |
+
multiprocess==0.70.16
|
| 62 |
+
sympy==1.13.1
|
| 63 |
+
psutil==7.2.2
|
| 64 |
+
h11==0.16.0
|
| 65 |
+
anyio==4.13.0
|
| 66 |
+
Cython==3.2.4
|
| 67 |
+
outlines_core==0.1.26
|
| 68 |
+
jsonschema==4.26.0
|
| 69 |
+
nvidia-cuda-cupti-cu12==12.4.127
|
| 70 |
+
meson-python==0.19.0
|
| 71 |
+
depyf==0.18.0
|
| 72 |
+
audioread==3.1.0
|
| 73 |
+
typer==0.24.1
|
| 74 |
+
nvidia-cuda-nvrtc-cu12==12.4.127
|
| 75 |
+
joblib==1.5.3
|
| 76 |
+
torchvision==0.21.0
|
| 77 |
+
hf-gradio==0.3.2
|
| 78 |
+
huggingface_hub==0.36.2
|
| 79 |
+
websockets==15.0.1
|
| 80 |
+
diskcache==5.6.3
|
| 81 |
+
mistral_common==1.11.0
|
| 82 |
+
partial-json-parser==0.2.1.1.post7
|
| 83 |
+
simplejson==3.20.2
|
| 84 |
+
watchfiles==1.1.1
|
| 85 |
+
Jinja2==3.1.6
|
| 86 |
+
GitPython==3.1.46
|
| 87 |
+
numexpr==2.11.0
|
| 88 |
+
pydub==0.25.1
|
| 89 |
+
brotli==1.2.0
|
| 90 |
+
binpacking==2.0.1
|
| 91 |
+
cmake==4.3.1
|
| 92 |
+
pydantic==2.12.3
|
| 93 |
+
mkl-service==2.4.0
|
| 94 |
+
protobuf==6.33.6
|
| 95 |
+
gguf==0.10.0
|
| 96 |
+
MarkupSafe==3.0.3
|
| 97 |
+
exceptiongroup==1.3.1
|
| 98 |
+
markdown-it-py==4.0.0
|
| 99 |
+
soxr==1.0.0
|
| 100 |
+
pyarrow==20.0.0
|
| 101 |
+
tqdm==4.67.3
|
| 102 |
+
meson==1.11.0
|
| 103 |
+
fonttools==4.62.1
|
| 104 |
+
annotated-types==0.7.0
|
| 105 |
+
networkx==3.4.2
|
| 106 |
+
nvidia-cuda-runtime-cu12==12.4.127
|
| 107 |
+
compressed-tensors==0.9.2
|
| 108 |
+
wandb==0.23.0
|
| 109 |
+
mdurl==0.1.2
|
| 110 |
+
charset-normalizer==3.4.7
|
| 111 |
+
Pygments==2.20.0
|
| 112 |
+
zipp==3.23.1
|
| 113 |
+
prometheus-fastapi-instrumentator==7.1.0
|
| 114 |
+
aiofiles==24.1.0
|
| 115 |
+
lark==1.2.2
|
| 116 |
+
addict==2.4.0
|
| 117 |
+
pydantic-settings==2.13.1
|
| 118 |
+
opencv-python-headless==4.11.0.86
|
| 119 |
+
certifi==2026.2.25
|
| 120 |
+
sox==1.5.0
|
| 121 |
+
nagisa==0.2.11
|
| 122 |
+
six==1.17.0
|
| 123 |
+
tokenizers==0.22.2
|
| 124 |
+
mkl_random==1.2.8
|
| 125 |
+
fastapi-cloud-cli==0.17.0
|
| 126 |
+
propcache==0.4.1
|
| 127 |
+
cachetools==7.0.5
|
| 128 |
+
rpds-py==0.30.0
|
| 129 |
+
torchaudio==2.6.0
|
| 130 |
+
setuptools==82.0.1
|
| 131 |
+
py-cpuinfo==9.0.0
|
| 132 |
+
tomli==2.4.1
|
| 133 |
+
xxhash==3.6.0
|
| 134 |
+
pip==26.0.1
|
| 135 |
+
contourpy==1.3.2
|
| 136 |
+
absl-py==2.4.0
|
| 137 |
+
mpmath==1.3.0
|
| 138 |
+
ms_swift==4.0.3
|
| 139 |
+
pyproject-metadata==0.11.0
|
| 140 |
+
aiohappyeyeballs==2.6.1
|
| 141 |
+
httpx==0.28.1
|
| 142 |
+
json_repair==0.59.4
|
| 143 |
+
blinker==1.9.0
|
| 144 |
+
tzdata==2025.3
|
| 145 |
+
tensorboard-data-server==0.7.2
|
| 146 |
+
pydantic-extra-types==2.11.1
|
| 147 |
+
Markdown==3.10.2
|
| 148 |
+
nvidia-cusparselt-cu12==0.6.2
|
| 149 |
+
rignore==0.7.6
|
| 150 |
+
openai==2.32.0
|
| 151 |
+
soundfile==0.13.1
|
| 152 |
+
lazy-loader==0.5
|
| 153 |
+
av==14.2.0
|
| 154 |
+
yarl==1.23.0
|
| 155 |
+
python-dateutil==2.9.0.post0
|
| 156 |
+
groovy==0.1.2
|
| 157 |
+
xformers==0.0.29.post2
|
| 158 |
+
qwen-omni-utils==0.0.9
|
| 159 |
+
rich==15.0.0
|
| 160 |
+
xgrammar==0.1.16
|
| 161 |
+
numba==0.60.0
|
| 162 |
+
nvidia-cusolver-cu12==11.6.1.9
|
| 163 |
+
scikit_build_core==0.12.2
|
| 164 |
+
ffmpy==1.0.0
|
| 165 |
+
wheel==0.46.3
|
| 166 |
+
jiter==0.14.0
|
| 167 |
+
oss2==2.19.1
|
| 168 |
+
transformers==4.57.6
|
| 169 |
+
fastrlock==0.8.3
|
| 170 |
+
click==8.3.2
|
| 171 |
+
pooch==1.9.0
|
| 172 |
+
distro==1.9.0
|
| 173 |
+
nvidia-cublas-cu12==12.4.5.8
|
| 174 |
+
regex==2026.4.4
|
| 175 |
+
cpm-kernels==1.0.11
|
| 176 |
+
safehttpx==0.1.7
|
| 177 |
+
matplotlib==3.10.8
|
| 178 |
+
httptools==0.7.1
|
| 179 |
+
nvidia-cusparse-cu12==12.3.1.170
|
| 180 |
+
qwen-asr==0.0.6
|
| 181 |
+
gradio_client==1.14.0
|
| 182 |
+
gitdb==4.0.12
|
| 183 |
+
fastapi-cli==0.0.24
|
| 184 |
+
soynlp==0.0.493
|
| 185 |
+
python-dotenv==1.2.2
|
| 186 |
+
nvidia-cufft-cu12==11.2.1.3
|
| 187 |
+
accelerate==1.12.0
|
| 188 |
+
tomlkit==0.13.3
|
| 189 |
+
triton==3.2.0
|
| 190 |
+
filelock==3.28.0
|
| 191 |
+
pycountry==26.2.16
|
| 192 |
+
modelscope==1.35.4
|
| 193 |
+
annotated-doc==0.0.4
|
| 194 |
+
referencing==0.37.0
|
| 195 |
+
numpy==1.26.4
|
| 196 |
+
aliyun-python-sdk-core==2.16.0
|
| 197 |
+
attrs==26.1.0
|
| 198 |
+
vllm==0.8.0
|
| 199 |
+
python-multipart==0.0.26
|
| 200 |
+
jsonschema-specifications==2025.9.1
|
| 201 |
+
idna==3.11
|
| 202 |
+
scipy==1.15.3
|
| 203 |
+
typing_extensions==4.15.0
|
| 204 |
+
itsdangerous==2.2.0
|
| 205 |
+
msgspec==0.21.1
|
| 206 |
+
msgpack==1.1.2
|
| 207 |
+
nvidia-nvjitlink-cu12==12.4.127
|
| 208 |
+
pycryptodome==3.23.0
|
| 209 |
+
ninja==1.13.0
|
| 210 |
+
pillow==11.3.0
|
| 211 |
+
email-validator==2.3.0
|
| 212 |
+
cryptography==46.0.7
|
| 213 |
+
peft==0.18.1
|
| 214 |
+
kiwisolver==1.5.0
|
| 215 |
+
cffi==2.0.0
|
| 216 |
+
einops==0.8.2
|
| 217 |
+
pytz==2026.1.post1
|
| 218 |
+
uvloop==0.22.1
|
| 219 |
+
requests==2.33.1
|
| 220 |
+
sentencepiece==0.2.1
|
| 221 |
+
attrdict==2.0.1
|
| 222 |
+
dacite==1.9.2
|
| 223 |
+
cloudpickle==3.1.2
|
| 224 |
+
ray==2.55.0
|
| 225 |
+
fastapi==0.135.3
|
| 226 |
+
librosa==0.11.0
|
| 227 |
+
ruff==0.15.10
|
| 228 |
+
multidict==6.7.1
|
| 229 |
+
smmap==5.0.3
|
| 230 |
+
packaging==26.0
|
| 231 |
+
pycparser==3.0
|
| 232 |
+
decorator==5.2.1
|
| 233 |
+
transformers-stream-generator==0.0.5
|
| 234 |
+
nvidia-nccl-cu12==2.21.5
|
| 235 |
+
frozenlist==1.8.0
|
| 236 |
+
uvicorn==0.44.0
|
| 237 |
+
datasets==3.6.0
|
| 238 |
+
cycler==0.12.1
|
| 239 |
+
omegaconf==2.3.0
|
| 240 |
+
httpcore==1.0.9
|
| 241 |
+
pandas==2.3.2
|
| 242 |
+
nvidia-nvtx-cu12==12.4.127
|
| 243 |
+
sentry-sdk==2.58.0
|
| 244 |
+
wheel==0.46.3
|
| 245 |
+
autocommand==2.2.2
|
| 246 |
+
tomli==2.4.0
|
| 247 |
+
packaging==26.0
|
| 248 |
+
more-itertools==10.8.0
|
| 249 |
+
zipp==3.23.0
|
| 250 |
+
platformdirs==4.4.0
|
| 251 |
+
jaraco.context==6.1.0
|
| 252 |
+
jaraco.text==4.0.0
|
| 253 |
+
backports.tarfile==1.2.0
|
| 254 |
+
jaraco.functools==4.4.0
|
| 255 |
+
importlib_metadata==8.7.1
|
wandb/run-20260418_172847-c2a5hfz3/files/wandb-metadata.json
ADDED
|
@@ -0,0 +1,213 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"os": "Linux-3.10.0-957.el7.x86_64-x86_64-with-glibc2.17",
|
| 3 |
+
"python": "CPython 3.10.18",
|
| 4 |
+
"startedAt": "2026-04-18T09:28:47.432340Z",
|
| 5 |
+
"args": [
|
| 6 |
+
"--rlhf_type",
|
| 7 |
+
"grpo",
|
| 8 |
+
"--external_plugins",
|
| 9 |
+
"/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/my_qwen3_asr_dapo_register.py",
|
| 10 |
+
"/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/0417_reward.py",
|
| 11 |
+
"--model",
|
| 12 |
+
"/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/qwen3-asr-merged",
|
| 13 |
+
"--model_type",
|
| 14 |
+
"my_qwen3_asr_rl",
|
| 15 |
+
"--template",
|
| 16 |
+
"my_qwen3_asr_rl",
|
| 17 |
+
"--dataset",
|
| 18 |
+
"/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/lora_0323_10w+55w+error+syn_with_domain_train90_targeted_rl_train90_loramerged_basewer_3suppress_server.jsonl",
|
| 19 |
+
"--val_dataset",
|
| 20 |
+
"/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/lora_0323_10w+55w+error+syn_with_domain_train90_targeted_rl_val5_sample5p_server.jsonl",
|
| 21 |
+
"--reward_funcs",
|
| 22 |
+
"asr_wer_sub_len_cmp_hallu_dirty_v56",
|
| 23 |
+
"--train_type",
|
| 24 |
+
"lora",
|
| 25 |
+
"--use_vllm",
|
| 26 |
+
"false",
|
| 27 |
+
"--log_completions",
|
| 28 |
+
"true",
|
| 29 |
+
"--loss_type",
|
| 30 |
+
"dapo",
|
| 31 |
+
"--advantage_estimator",
|
| 32 |
+
"grpo",
|
| 33 |
+
"--scale_rewards",
|
| 34 |
+
"group",
|
| 35 |
+
"--num_iterations",
|
| 36 |
+
"2",
|
| 37 |
+
"--beta",
|
| 38 |
+
"0.04",
|
| 39 |
+
"--epsilon_high",
|
| 40 |
+
"0.28",
|
| 41 |
+
"--dynamic_sample",
|
| 42 |
+
"true",
|
| 43 |
+
"--max_resample_times",
|
| 44 |
+
"4",
|
| 45 |
+
"--overlong_filter",
|
| 46 |
+
"true",
|
| 47 |
+
"--truncation_strategy",
|
| 48 |
+
"delete",
|
| 49 |
+
"--num_generations",
|
| 50 |
+
"12",
|
| 51 |
+
"--generation_batch_size",
|
| 52 |
+
"48",
|
| 53 |
+
"--per_device_train_batch_size",
|
| 54 |
+
"4",
|
| 55 |
+
"--per_device_eval_batch_size",
|
| 56 |
+
"4",
|
| 57 |
+
"--gradient_accumulation_steps",
|
| 58 |
+
"12",
|
| 59 |
+
"--num_generations_eval",
|
| 60 |
+
"4",
|
| 61 |
+
"--max_completion_length",
|
| 62 |
+
"256",
|
| 63 |
+
"--temperature",
|
| 64 |
+
"0.50",
|
| 65 |
+
"--top_p",
|
| 66 |
+
"0.95",
|
| 67 |
+
"--top_k",
|
| 68 |
+
"50",
|
| 69 |
+
"--repetition_penalty",
|
| 70 |
+
"1.08",
|
| 71 |
+
"--learning_rate",
|
| 72 |
+
"5e-5",
|
| 73 |
+
"--lr_scheduler_type",
|
| 74 |
+
"cosine",
|
| 75 |
+
"--warmup_ratio",
|
| 76 |
+
"0.03",
|
| 77 |
+
"--report_to",
|
| 78 |
+
"wandb",
|
| 79 |
+
"--run_name",
|
| 80 |
+
"qwen3asr_dapo_reward56_4x4x12_12gen_4GPU",
|
| 81 |
+
"--output_dir",
|
| 82 |
+
"/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/out/qwen3asr_dapo_reward56_4x4x12_12gen_4GPU",
|
| 83 |
+
"--save_strategy",
|
| 84 |
+
"steps",
|
| 85 |
+
"--save_steps",
|
| 86 |
+
"20",
|
| 87 |
+
"--logging_steps",
|
| 88 |
+
"5",
|
| 89 |
+
"--freeze_llm",
|
| 90 |
+
"false",
|
| 91 |
+
"--freeze_vit",
|
| 92 |
+
"false",
|
| 93 |
+
"--freeze_aligner",
|
| 94 |
+
"false",
|
| 95 |
+
"--remove_unused_columns",
|
| 96 |
+
"false",
|
| 97 |
+
"--padding_side",
|
| 98 |
+
"left"
|
| 99 |
+
],
|
| 100 |
+
"program": "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/cli/rlhf.py",
|
| 101 |
+
"email": "pang_kaiyu@163.com",
|
| 102 |
+
"root": "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload",
|
| 103 |
+
"host": "SH-IDC1-10-140-37-95",
|
| 104 |
+
"executable": "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/bin/python3.10",
|
| 105 |
+
"cpu_count": 64,
|
| 106 |
+
"cpu_count_logical": 128,
|
| 107 |
+
"gpu": "NVIDIA A100-SXM4-80GB",
|
| 108 |
+
"gpu_count": 8,
|
| 109 |
+
"disk": {
|
| 110 |
+
"/": {
|
| 111 |
+
"total": "524945911808",
|
| 112 |
+
"used": "37368901632"
|
| 113 |
+
}
|
| 114 |
+
},
|
| 115 |
+
"memory": {
|
| 116 |
+
"total": "1081627828224"
|
| 117 |
+
},
|
| 118 |
+
"gpu_nvidia": [
|
| 119 |
+
{
|
| 120 |
+
"name": "NVIDIA A100-SXM4-80GB",
|
| 121 |
+
"memoryTotal": "85899345920",
|
| 122 |
+
"cudaCores": 6912,
|
| 123 |
+
"architecture": "Ampere",
|
| 124 |
+
"uuid": "GPU-87e7e3ab-b254-fc22-7407-8e2e88e9d854"
|
| 125 |
+
},
|
| 126 |
+
{
|
| 127 |
+
"name": "NVIDIA A100-SXM4-80GB",
|
| 128 |
+
"memoryTotal": "85899345920",
|
| 129 |
+
"cudaCores": 6912,
|
| 130 |
+
"architecture": "Ampere",
|
| 131 |
+
"uuid": "GPU-976db8a1-cf00-11c6-caaa-413862233fd4"
|
| 132 |
+
},
|
| 133 |
+
{
|
| 134 |
+
"name": "NVIDIA A100-SXM4-80GB",
|
| 135 |
+
"memoryTotal": "85899345920",
|
| 136 |
+
"cudaCores": 6912,
|
| 137 |
+
"architecture": "Ampere",
|
| 138 |
+
"uuid": "GPU-78b37ae8-44e0-e318-a6c0-f6f4ac78d46a"
|
| 139 |
+
},
|
| 140 |
+
{
|
| 141 |
+
"name": "NVIDIA A100-SXM4-80GB",
|
| 142 |
+
"memoryTotal": "85899345920",
|
| 143 |
+
"cudaCores": 6912,
|
| 144 |
+
"architecture": "Ampere",
|
| 145 |
+
"uuid": "GPU-840b937d-a7d4-68e7-ad57-f4568e01c3ae"
|
| 146 |
+
},
|
| 147 |
+
{
|
| 148 |
+
"name": "NVIDIA A100-SXM4-80GB",
|
| 149 |
+
"memoryTotal": "85899345920",
|
| 150 |
+
"cudaCores": 6912,
|
| 151 |
+
"architecture": "Ampere",
|
| 152 |
+
"uuid": "GPU-a9d0de54-f5b5-f83b-7bda-f53db844622d"
|
| 153 |
+
},
|
| 154 |
+
{
|
| 155 |
+
"name": "NVIDIA A100-SXM4-80GB",
|
| 156 |
+
"memoryTotal": "85899345920",
|
| 157 |
+
"cudaCores": 6912,
|
| 158 |
+
"architecture": "Ampere",
|
| 159 |
+
"uuid": "GPU-cb7d22e9-305c-c68c-64f1-599580742db0"
|
| 160 |
+
},
|
| 161 |
+
{
|
| 162 |
+
"name": "NVIDIA A100-SXM4-80GB",
|
| 163 |
+
"memoryTotal": "85899345920",
|
| 164 |
+
"cudaCores": 6912,
|
| 165 |
+
"architecture": "Ampere",
|
| 166 |
+
"uuid": "GPU-8d9704bb-4592-346f-a7f2-1a6ed8d58619"
|
| 167 |
+
},
|
| 168 |
+
{
|
| 169 |
+
"name": "NVIDIA A100-SXM4-80GB",
|
| 170 |
+
"memoryTotal": "85899345920",
|
| 171 |
+
"cudaCores": 6912,
|
| 172 |
+
"architecture": "Ampere",
|
| 173 |
+
"uuid": "GPU-3892f01b-e0b8-a9d9-0587-b5a7d2d9b5ab"
|
| 174 |
+
}
|
| 175 |
+
],
|
| 176 |
+
"cudaVersion": "12.4",
|
| 177 |
+
"slurm": {
|
| 178 |
+
"cluster_name": "cluster_sproject3",
|
| 179 |
+
"conf": "/etc/slurm/slurm.conf",
|
| 180 |
+
"cpus_on_node": "2",
|
| 181 |
+
"gtids": "0",
|
| 182 |
+
"job_account": "research",
|
| 183 |
+
"job_cpus_per_node": "2",
|
| 184 |
+
"job_gid": "800000689",
|
| 185 |
+
"job_gpus": "0,1,2,6",
|
| 186 |
+
"job_id": "8574598",
|
| 187 |
+
"job_name": "qwen3_asr_train_4gpu",
|
| 188 |
+
"job_nodelist": "SH-IDC1-10-140-37-95",
|
| 189 |
+
"job_num_nodes": "1",
|
| 190 |
+
"job_partition": "interntmp",
|
| 191 |
+
"job_qos": "normal",
|
| 192 |
+
"job_uid": "800000689",
|
| 193 |
+
"job_user": "panjiabao",
|
| 194 |
+
"jobid": "8574598",
|
| 195 |
+
"localid": "0",
|
| 196 |
+
"nnodes": "1",
|
| 197 |
+
"node_aliases": "(null)",
|
| 198 |
+
"nodeid": "0",
|
| 199 |
+
"nodelist": "SH-IDC1-10-140-37-95",
|
| 200 |
+
"nprocs": "1",
|
| 201 |
+
"ntasks": "1",
|
| 202 |
+
"prio_process": "0",
|
| 203 |
+
"procid": "0",
|
| 204 |
+
"submit_dir": "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload",
|
| 205 |
+
"submit_host": "SH-IDC1-10-140-37-164",
|
| 206 |
+
"task_pid": "9466",
|
| 207 |
+
"tasks_per_node": "1",
|
| 208 |
+
"topology_addr": "SH-IDC1-10-140-37-95",
|
| 209 |
+
"topology_addr_pattern": "node",
|
| 210 |
+
"working_cluster": "cluster_sproject3:SH-IDC1-10-140-37-161:6817:9216:109"
|
| 211 |
+
},
|
| 212 |
+
"writerId": "ess1zs9oqcfvbaak4xbqvnst142xqp1g"
|
| 213 |
+
}
|
wandb/run-20260418_172847-c2a5hfz3/files/wandb-summary.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"train/completions/max_length":374.1,"eval/kl":0.5471468614941498,"profiling/Time taken: GRPOTrainer.resample_encode_failed_inputs":0.10830203304067254,"profiling/Time taken: GRPOTrainer.generate":2.985434970119968,"eval/clip_ratio/region_mean":0,"train/reward_std":0.18413368090987206,"profiling/Time taken: GRPOTrainer._prepare_batch_inputs":1.4252209290862083,"eval/loss":0.023608719930052757,"train/clip_ratio/low_min":0.002832426130771637,"eval/frac_reward_zero_std":0.15566037735849056,"eval/rewards/ASRWerSubLenCmpHalluDirtyV56/std":0.5037064297862772,"train/clip_ratio/high_mean":0.013257157216624666,"eval/samples_per_second":1.028,"_wandb":{"runtime":167801},"train/global_step":1200,"train/kl":0.7693365861972173,"eval/steps_per_second":0.067,"eval/runtime":208.2116,"profiling/Time taken: GRPOTrainer.compute_loss":0.3779073969926685,"train/rewards/ASRWerSubLenCmpHalluDirtyV56/mean":0.16251326091587542,"eval/reward_std":0.1169186263643908,"profiling/Time taken: GRPOTrainer._generate_and_score_completions":5.926984405843541,"eval/clip_ratio/low_mean":0,"eval/clip_ratio/high_mean":0,"train/clip_ratio/high_max":0.028729480388574303,"profiling/Time taken: GRPOTrainer.ASRWerSubLenCmpHalluDirtyV56":0.06905108108185232,"profiling/Time taken: GRPOTrainer.log_metrics":0.022023104829713702,"train/clip_ratio/region_mean":0.028791408023486533,"train/frac_reward_zero_std":0,"eval/reward":0.4663126377283402,"eval/completions/mean_length":45.948113207547166,"train/completions/clipped_ratio":0.004166666666666667,"eval/clip_ratio/low_min":0,"eval/completions/clipped_ratio":0,"profiling/Time taken: 
GRPOTrainer._get_per_token_logps_and_entropies":0.3741553670261055,"train/clip_ratio/low_mean":0.015534250618657097,"eval/clip_ratio/high_max":0,"_step":598,"train/learning_rate":4.87350326370979e-05,"train/step_time":50.95165289340075,"eval/completions/max_length":59.15094339622642,"completions":{"size":31217,"ncols":6,"artifact_path":"wandb-client-artifact://jli2kdi7ef7w5pgm5t5mfpancx9qoq5net2vqru9ku5vuevkioj6uoqgmy6ojheyps4eavp8glqspzt63cid5rz59ib1yfz438dry4cbc1rcrle1x0kc6u6baofnvzp5/completions.table.json","_type":"table-file","sha256":"15ac642a65a06a04c3f33750733a3b61b5c428d4f70e069739b3c7df835ae44d","_latest_artifact_path":"wandb-client-artifact://mm4npojrnrffcjkkzw46vtbqn9bp7hms1vx6ohyncuuv16yny2waqf8rilfjn20oz6zu5pl07fwb5wqd7m6kprccayx2errp2xqtifzi27gnfukness54t79wm4t5agy:latest/completions.table.json","log_mode":"IMMUTABLE","nrows":48,"path":"media/table/completions_597_15ac642a65a06a04c3f3.table.json"},"profiling/Time taken: GRPOTrainer._score_completions":0.06985888280905783,"train/reward":0.1625132780522108,"_runtime":167801,"_timestamp":1.776672310555167e+09,"train/grad_norm":0.4121144711971283,"train/rewards/ASRWerSubLenCmpHalluDirtyV56/std":0.43018959313631056,"eval/rewards/ASRWerSubLenCmpHalluDirtyV56/mean":0.4663126377283402,"train/completions/mean_length":52.735418701171874,"train/completions/min_length":29.85,"train/epoch":0.3859761981344484,"train/loss":0.01593678444623947,"profiling/Time taken: GRPOTrainer._dynamic_sampling":1.2856517911422998,"eval/completions/min_length":30.39622641509434,"profiling/Time taken: GRPOTrainer._prepare_inputs":6.024027243256569e-06}
|
wandb/run-20260418_172847-c2a5hfz3/logs/debug-internal.log
ADDED
|
@@ -0,0 +1,72 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{"time":"2026-04-18T17:28:47.877484976+08:00","level":"INFO","msg":"stream: starting","core version":"0.23.0"}
|
| 2 |
+
{"time":"2026-04-18T17:28:48.347618035+08:00","level":"INFO","msg":"stream: created new stream","id":"c2a5hfz3"}
|
| 3 |
+
{"time":"2026-04-18T17:28:48.347701352+08:00","level":"INFO","msg":"handler: started","stream_id":"c2a5hfz3"}
|
| 4 |
+
{"time":"2026-04-18T17:28:48.350844585+08:00","level":"INFO","msg":"stream: started","id":"c2a5hfz3"}
|
| 5 |
+
{"time":"2026-04-18T17:28:48.350849894+08:00","level":"INFO","msg":"writer: started","stream_id":"c2a5hfz3"}
|
| 6 |
+
{"time":"2026-04-18T17:28:48.350854798+08:00","level":"INFO","msg":"sender: started","stream_id":"c2a5hfz3"}
|
| 7 |
+
{"time":"2026-04-18T17:37:33.858258418+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 8 |
+
{"time":"2026-04-19T02:34:07.470718868+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 9 |
+
{"time":"2026-04-19T02:38:39.32386773+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": http2: client conn could not be established"}
|
| 10 |
+
{"time":"2026-04-19T02:40:17.658933776+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 11 |
+
{"time":"2026-04-19T02:43:03.564180775+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 12 |
+
{"time":"2026-04-19T02:44:49.518795314+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 13 |
+
{"time":"2026-04-19T02:45:08.529740538+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 14 |
+
{"time":"2026-04-19T02:46:20.848321936+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 15 |
+
{"time":"2026-04-19T02:49:05.639172159+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 16 |
+
{"time":"2026-04-19T15:09:49.426045163+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 17 |
+
{"time":"2026-04-19T15:57:04.347389276+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 18 |
+
{"time":"2026-04-19T16:02:30.488210102+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 19 |
+
{"time":"2026-04-19T22:07:33.03303113+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 20 |
+
{"time":"2026-04-19T22:07:51.98901393+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 21 |
+
{"time":"2026-04-19T22:08:16.035247515+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 22 |
+
{"time":"2026-04-19T22:09:42.186767689+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 23 |
+
{"time":"2026-04-19T22:24:00.480169619+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 24 |
+
{"time":"2026-04-19T22:24:34.690158146+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 25 |
+
{"time":"2026-04-19T22:28:36.622066809+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 26 |
+
{"time":"2026-04-19T22:28:59.75540152+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 27 |
+
{"time":"2026-04-19T22:31:22.975036457+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 28 |
+
{"time":"2026-04-19T22:34:17.890202383+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 29 |
+
{"time":"2026-04-19T22:43:21.155119859+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 30 |
+
{"time":"2026-04-19T22:43:38.33530735+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 31 |
+
{"time":"2026-04-19T22:46:03.44895843+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 32 |
+
{"time":"2026-04-19T22:48:50.248056745+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 33 |
+
{"time":"2026-04-19T22:49:48.447601198+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 34 |
+
{"time":"2026-04-19T22:52:35.56119014+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 35 |
+
{"time":"2026-04-19T22:52:50.371922946+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 36 |
+
{"time":"2026-04-19T22:56:30.747794336+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 37 |
+
{"time":"2026-04-19T22:58:32.547706574+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 38 |
+
{"time":"2026-04-19T23:00:23.617563694+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 39 |
+
{"time":"2026-04-19T23:00:37.717734501+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 40 |
+
{"time":"2026-04-19T23:05:31.94573349+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 41 |
+
{"time":"2026-04-19T23:05:44.893259249+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 42 |
+
{"time":"2026-04-20T00:03:04.382543732+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 43 |
+
{"time":"2026-04-20T00:03:19.501053157+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 44 |
+
{"time":"2026-04-20T00:05:31.556601347+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 45 |
+
{"time":"2026-04-20T00:06:03.495128433+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 46 |
+
{"time":"2026-04-20T00:11:23.73287074+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 47 |
+
{"time":"2026-04-20T02:58:43.522847172+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": net/http: request canceled (Client.Timeout exceeded while awaiting headers)"}
|
| 48 |
+
{"time":"2026-04-20T02:59:04.598457045+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": context deadline exceeded"}
|
| 49 |
+
{"time":"2026-04-20T02:59:15.733502761+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": context deadline exceeded (Client.Timeout exceeded while awaiting headers)"}
|
| 50 |
+
{"time":"2026-04-20T02:59:49.917399553+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": context deadline exceeded (Client.Timeout exceeded while awaiting headers)"}
|
| 51 |
+
{"time":"2026-04-20T03:00:07.058218433+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": context deadline exceeded"}
|
| 52 |
+
{"time":"2026-04-20T03:00:29.606621937+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": net/http: request canceled (Client.Timeout exceeded while awaiting headers)"}
|
| 53 |
+
{"time":"2026-04-20T03:00:34.624296643+08:00","level":"INFO","msg":"flowcontrol: backed up, offloading to disk","recordNumber":124381}
|
| 54 |
+
{"time":"2026-04-20T03:00:46.264621657+08:00","level":"INFO","msg":"flowcontrol: unblocked","totalOffloaded":1}
|
| 55 |
+
{"time":"2026-04-20T03:44:43.734398398+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": context deadline exceeded (Client.Timeout exceeded while awaiting headers)"}
|
| 56 |
+
{"time":"2026-04-20T04:11:48.762158534+08:00","level":"INFO","msg":"api: retrying HTTP error","status":503,"url":"https://api.wandb.ai/graphql","body":"upstream connect error or disconnect/reset before headers. reset reason: connection termination"}
|
| 57 |
+
{"time":"2026-04-20T04:13:58.74920069+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": net/http: request canceled (Client.Timeout exceeded while awaiting headers)"}
|
| 58 |
+
{"time":"2026-04-20T06:34:34.21211755+08:00","level":"INFO","msg":"api: retrying HTTP error","status":503,"url":"https://api.wandb.ai/graphql","body":"upstream connect error or disconnect/reset before headers. reset reason: connection termination"}
|
| 59 |
+
{"time":"2026-04-20T10:50:53.628901466+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 60 |
+
{"time":"2026-04-20T16:00:42.158363018+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 61 |
+
{"time":"2026-04-20T16:02:08.101875007+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 62 |
+
{"time":"2026-04-20T16:03:45.141714956+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 63 |
+
{"time":"2026-04-20T16:04:52.17332644+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 64 |
+
{"time":"2026-04-20T16:05:06.320377956+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 65 |
+
{"time":"2026-04-20T16:05:29.800728083+08:00","level":"ERROR","msg":"sender: sendStopStatus: failed to get run stopped status: context deadline exceeded (Client.Timeout or context cancellation while reading body)"}
|
| 66 |
+
{"time":"2026-04-20T16:05:30.799799131+08:00","level":"INFO","msg":"stream: closing","id":"c2a5hfz3"}
|
| 67 |
+
{"time":"2026-04-20T16:05:39.191906442+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 68 |
+
{"time":"2026-04-20T16:05:43.710909983+08:00","level":"INFO","msg":"fileTransfer: Close: file transfer manager closed"}
|
| 69 |
+
{"time":"2026-04-20T16:06:10.469686843+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
|
| 70 |
+
{"time":"2026-04-20T16:06:17.397266507+08:00","level":"INFO","msg":"handler: closed","stream_id":"c2a5hfz3"}
|
| 71 |
+
{"time":"2026-04-20T16:06:17.400263519+08:00","level":"INFO","msg":"sender: closed","stream_id":"c2a5hfz3"}
|
| 72 |
+
{"time":"2026-04-20T16:06:17.40028542+08:00","level":"INFO","msg":"stream: closed","id":"c2a5hfz3"}
|
wandb/run-20260418_172847-c2a5hfz3/logs/debug.log
ADDED
|
@@ -0,0 +1,26 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
2026-04-18 17:28:47,491 INFO MainThread:10295 [wandb_setup.py:_flush():80] Current SDK version is 0.23.0
|
| 2 |
+
2026-04-18 17:28:47,491 INFO MainThread:10295 [wandb_setup.py:_flush():80] Configure stats pid to 10295
|
| 3 |
+
2026-04-18 17:28:47,491 INFO MainThread:10295 [wandb_setup.py:_flush():80] Loading settings from /mnt/petrelfs/panjiabao/.config/wandb/settings
|
| 4 |
+
2026-04-18 17:28:47,491 INFO MainThread:10295 [wandb_setup.py:_flush():80] Loading settings from /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/wandb/settings
|
| 5 |
+
2026-04-18 17:28:47,491 INFO MainThread:10295 [wandb_setup.py:_flush():80] Loading settings from environment variables
|
| 6 |
+
2026-04-18 17:28:47,491 INFO MainThread:10295 [wandb_init.py:setup_run_log_directory():713] Logging user logs to /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/wandb/run-20260418_172847-c2a5hfz3/logs/debug.log
|
| 7 |
+
2026-04-18 17:28:47,491 INFO MainThread:10295 [wandb_init.py:setup_run_log_directory():714] Logging internal logs to /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/wandb/run-20260418_172847-c2a5hfz3/logs/debug-internal.log
|
| 8 |
+
2026-04-18 17:28:47,491 INFO MainThread:10295 [wandb_init.py:init():840] calling init triggers
|
| 9 |
+
2026-04-18 17:28:47,491 INFO MainThread:10295 [wandb_init.py:init():845] wandb.init called with sweep_config: {}
|
| 10 |
+
config: {'_wandb': {}}
|
| 11 |
+
2026-04-18 17:28:47,491 INFO MainThread:10295 [wandb_init.py:init():888] starting backend
|
| 12 |
+
2026-04-18 17:28:47,865 INFO MainThread:10295 [wandb_init.py:init():891] sending inform_init request
|
| 13 |
+
2026-04-18 17:28:47,870 INFO MainThread:10295 [wandb_init.py:init():899] backend started and connected
|
| 14 |
+
2026-04-18 17:28:47,874 INFO MainThread:10295 [wandb_init.py:init():969] updated telemetry
|
| 15 |
+
2026-04-18 17:28:47,875 INFO MainThread:10295 [wandb_init.py:init():993] communicating run to backend with 90.0 second timeout
|
| 16 |
+
2026-04-18 17:28:49,589 INFO MainThread:10295 [wandb_init.py:init():1040] starting run threads in backend
|
| 17 |
+
2026-04-18 17:28:50,217 INFO MainThread:10295 [wandb_run.py:_console_start():2504] atexit reg
|
| 18 |
+
2026-04-18 17:28:50,218 INFO MainThread:10295 [wandb_run.py:_redirect():2352] redirect: wrap_raw
|
| 19 |
+
2026-04-18 17:28:50,218 INFO MainThread:10295 [wandb_run.py:_redirect():2421] Wrapping output streams.
|
| 20 |
+
2026-04-18 17:28:50,218 INFO MainThread:10295 [wandb_run.py:_redirect():2444] Redirects installed.
|
| 21 |
+
2026-04-18 17:28:50,224 INFO MainThread:10295 [wandb_init.py:init():1080] run started, returning control to user process
|
| 22 |
+
2026-04-18 17:28:50,229 INFO MainThread:10295 [wandb_run.py:_config_callback():1385] config_cb None None {'peft_config': {'default': {'task_type': 'CAUSAL_LM', 'peft_type': 'LORA', 'auto_mapping': None, 'peft_version': '0.18.1', 'base_model_name_or_path': '/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/qwen3-asr-merged', 'revision': None, 'inference_mode': False, 'r': 8, 'target_modules': '^(thinker\\.model(?=\\.).*\\.(up_proj|q_proj|o_proj|gate_proj|k_proj|v_proj|down_proj)|thinker\\.audio_tower\\.layers(?=\\.).*\\.(q_proj|fc1|out_proj|k_proj|v_proj|fc2)|thinker\\.audio_tower\\.conv_out(?=\\.)|thinker\\.audio_tower\\.proj1(?=\\.)|thinker\\.audio_tower\\.proj2(?=\\.))$', 'exclude_modules': None, 'lora_alpha': 32, 'lora_dropout': 0.05, 'fan_in_fan_out': False, 'bias': 'none', 'use_rslora': False, 'modules_to_save': [], 'init_lora_weights': True, 'layers_to_transform': None, 'layers_pattern': None, 'rank_pattern': {}, 'alpha_pattern': {}, 'megatron_config': None, 'megatron_core': 'megatron.core', 'trainable_token_indices': None, 'loftq_config': {}, 'eva_config': None, 'corda_config': None, 'use_dora': False, 'alora_invocation_tokens': None, 'use_qalora': False, 'qalora_group_size': 16, 'layer_replication': None, 'runtime_config': {'ephemeral_gpu_offload': False}, 'lora_bias': False, 'target_parameters': None, 'arrow_config': None, 'ensure_weight_tying': False, 'lora_dtype': None, 'lorap_lr_ratio': None, 'lorap_emb_lr': 1e-06}}, 'return_dict': True, 'output_hidden_states': False, 'torchscript': False, 'dtype': 'bfloat16', 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'architectures': ['Qwen3ASRForConditionalGeneration'], 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'task_specific_params': None, 'problem_type': None, 
'tokenizer_class': None, 'prefix': None, 'bos_token_id': None, 'pad_token_id': 151643, 'eos_token_id': 151645, 'sep_token_id': None, 'decoder_start_token_id': None, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'temperature': 0.5, 'top_k': 50, 'top_p': 0.95, 'typical_p': 1.0, 'repetition_penalty': 1.08, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'num_beam_groups': 1, 'diversity_penalty': 0.0, '_name_or_path': '/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/qwen3-asr-merged', 'transformers_version': '4.57.6', 'model_type': 'qwen3_asr', 'tf_legacy_loss': False, 'use_bfloat16': False, 'thinker_config': {'return_dict': True, 'output_hidden_states': False, 'torchscript': False, 'dtype': 'bfloat16', 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'architectures': ['Qwen3ASRForConditionalGeneration'], 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'task_specific_params': None, 'problem_type': None, 'tokenizer_class': None, 'prefix': None, 'bos_token_id': None, 'pad_token_id': None, 'eos_token_id': None, 'sep_token_id': None, 'decoder_start_token_id': None, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'typical_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 
'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'num_beam_groups': 1, 'diversity_penalty': 0.0, '_name_or_path': '', 'audio_end_token_id': 151670, 'model_type': 'qwen3_asr_thinker', 'tf_legacy_loss': False, 'use_bfloat16': False, 'user_token_id': 872, 'audio_start_token_id': 151669, 'initializer_range': 0.02, 'audio_config': {'return_dict': True, 'output_hidden_states': False, 'torchscript': False, 'dtype': None, 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'architectures': None, 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'task_specific_params': None, 'problem_type': None, 'tokenizer_class': None, 'prefix': None, 'bos_token_id': None, 'pad_token_id': None, 'eos_token_id': None, 'sep_token_id': None, 'decoder_start_token_id': None, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'typical_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'num_beam_groups': 1, 'diversity_penalty': 0.0, '_name_or_path': '', 'model_type': 'qwen3_asr_audio_encoder', 'num_hidden_layers': 24, 'tf_legacy_loss': False, 'use_bfloat16': False, 'num_mel_bins': 128, 'd_model': 
1024, 'encoder_layers': 24, 'encoder_attention_heads': 16, 'encoder_ffn_dim': 4096, 'dropout': 0, 'attention_dropout': 0, 'activation_function': 'gelu', 'activation_dropout': 0, 'initializer_range': 0.02, 'scale_embedding': False, 'max_source_positions': 1500, 'n_window': 50, 'output_dim': 2048, 'n_window_infer': 800, 'conv_chunksize': 500, 'downsample_hidden_size': 480, 'output_attentions': False}, 'text_config': {'vocab_size': 151936, 'max_position_embeddings': 65536, 'hidden_size': 2048, 'intermediate_size': 6144, 'num_hidden_layers': 28, 'num_attention_heads': 16, 'num_key_value_heads': 8, 'head_dim': 128, 'hidden_act': 'silu', 'initializer_range': 0.02, 'rms_norm_eps': 1e-06, 'use_cache': False, 'rope_theta': 1000000, 'rope_scaling': {'interleaved': True, 'mrope_interleaved': True, 'mrope_section': [24, 20, 20], 'rope_type': 'default', 'type': 'default'}, 'attention_bias': False, 'attention_dropout': 0.0, 'return_dict': True, 'output_hidden_states': False, 'torchscript': False, 'dtype': None, 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'architectures': None, 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'task_specific_params': None, 'problem_type': None, 'tokenizer_class': None, 'prefix': None, 'bos_token_id': None, 'pad_token_id': 151643, 'eos_token_id': None, 'sep_token_id': None, 'decoder_start_token_id': None, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'typical_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 
'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'num_beam_groups': 1, 'diversity_penalty': 0.0, '_name_or_path': '', 'model_type': 'qwen3_asr_text', 'tf_legacy_loss': False, 'use_bfloat16': False, 'output_attentions': False}, 'audio_token_id': 151676, 'output_attentions': False}, 'support_languages': ['Chinese', 'English', 'Cantonese', 'Arabic', 'German', 'French', 'Spanish', 'Portuguese', 'Indonesian', 'Italian', 'Korean', 'Russian', 'Thai', 'Vietnamese', 'Japanese', 'Turkish', 'Hindi', 'Malay', 'Dutch', 'Swedish', 'Danish', 'Finnish', 'Polish', 'Czech', 'Filipino', 'Persian', 'Greek', 'Romanian', 'Hungarian', 'Macedonian'], 'output_attentions': False, 'output_dir': '/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/out/qwen3asr_dapo_reward56_4x4x12_12gen_4GPU/v5-20260418-172837', 'overwrite_output_dir': False, 'do_train': False, 'do_eval': True, 'do_predict': False, 'eval_strategy': 'steps', 'prediction_loss_only': False, 'per_device_train_batch_size': 4, 'per_device_eval_batch_size': 4, 'per_gpu_train_batch_size': None, 'per_gpu_eval_batch_size': None, 'gradient_accumulation_steps': 12, 'eval_accumulation_steps': None, 'eval_delay': 0, 'torch_empty_cache_steps': None, 'learning_rate': 5e-05, 'weight_decay': 0.1, 'adam_beta1': 0.9, 'adam_beta2': 0.95, 'adam_epsilon': 1e-08, 'max_grad_norm': 1.0, 'num_train_epochs': 3.0, 'max_steps': -1, 'lr_scheduler_type': 'cosine', 'lr_scheduler_kwargs': None, 'warmup_ratio': 0.03, 'warmup_steps': 0, 'log_level': 'passive', 'log_level_replica': 'warning', 'log_on_each_node': True, 'logging_dir': '/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/out/qwen3asr_dapo_reward56_4x4x12_12gen_4GPU/v5-20260418-172837/runs', 'logging_strategy': 'steps', 'logging_first_step': True, 'logging_steps': 5, 'logging_nan_inf_filter': True, 'save_strategy': 'steps', 'save_steps': 20, 'save_total_limit': 
None, 'save_safetensors': True, 'save_on_each_node': False, 'save_only_model': False, 'restore_callback_states_from_checkpoint': False, 'no_cuda': False, 'use_cpu': False, 'use_mps_device': False, 'seed': 42, 'data_seed': 42, 'jit_mode_eval': False, 'bf16': True, 'fp16': False, 'fp16_opt_level': 'O1', 'half_precision_backend': 'auto', 'bf16_full_eval': False, 'fp16_full_eval': False, 'tf32': None, 'local_rank': 0, 'ddp_backend': None, 'tpu_num_cores': None, 'tpu_metrics_debug': False, 'debug': [], 'dataloader_drop_last': True, 'eval_steps': 20, 'dataloader_num_workers': 1, 'dataloader_prefetch_factor': 2, 'past_index': -1, 'run_name': 'qwen3asr_dapo_reward56_4x4x12_12gen_4GPU', 'disable_tqdm': False, 'remove_unused_columns': False, 'label_names': None, 'load_best_model_at_end': False, 'metric_for_best_model': 'loss', 'greater_is_better': False, 'ignore_data_skip': False, 'fsdp': [], 'fsdp_min_num_params': 0, 'fsdp_config': {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}, 'fsdp_transformer_layer_cls_to_wrap': None, 'accelerator_config': {'split_batches': False, 'dispatch_batches': False, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None}, 'parallelism_config': None, 'deepspeed': None, 'label_smoothing_factor': 0.0, 'optim': 'adamw_torch', 'optim_args': None, 'adafactor': False, 'group_by_length': False, 'length_column_name': 'length', 'report_to': ['wandb'], 'project': 'huggingface', 'trackio_space_id': 'trackio', 'ddp_find_unused_parameters': None, 'ddp_bucket_cap_mb': None, 'ddp_broadcast_buffers': None, 'dataloader_pin_memory': True, 'dataloader_persistent_workers': False, 'skip_memory_metrics': True, 'use_legacy_prediction_loop': False, 'push_to_hub': False, 'resume_from_checkpoint': None, 'hub_model_id': None, 'hub_strategy': 'every_save', 'hub_token': '<HUB_TOKEN>', 'hub_private_repo': None, 'hub_always_push': False, 'hub_revision': None, 
'gradient_checkpointing': False, 'gradient_checkpointing_kwargs': None, 'include_inputs_for_metrics': False, 'include_for_metrics': [], 'eval_do_concat_batches': True, 'fp16_backend': 'auto', 'push_to_hub_model_id': None, 'push_to_hub_organization': None, 'push_to_hub_token': '<PUSH_TO_HUB_TOKEN>', 'mp_parameters': '', 'auto_find_batch_size': False, 'full_determinism': False, 'torchdynamo': None, 'ray_scope': 'last', 'ddp_timeout': 18000000, 'torch_compile': False, 'torch_compile_backend': None, 'torch_compile_mode': None, 'include_tokens_per_second': False, 'include_num_input_tokens_seen': 'no', 'neftune_noise_alpha': None, 'optim_target_modules': None, 'batch_eval_metrics': False, 'eval_on_start': False, 'use_liger_kernel': False, 'liger_kernel_config': None, 'eval_use_gather_object': False, 'average_tokens_across_devices': True, 'model_init_kwargs': None, 'disable_dropout': False, 'cast_lm_head_to_fp32': False, 'num_generations': 12, 'num_generations_eval': 4, 'max_completion_length': 256, 'ds3_gather_for_generation': True, 'shuffle_dataset': True, 'generation_batch_size': 48, 'steps_per_generation': 3, 'min_p': None, 'generation_kwargs': None, 'chat_template_kwargs': None, 'use_transformers_paged': False, 'cache_implementation': None, 'use_vllm': False, 'vllm_mode': None, 'vllm_model_impl': 'vllm', 'vllm_enable_sleep_mode': False, 'vllm_structured_outputs_regex': None, 'vllm_server_base_url': None, 'vllm_server_host': None, 'vllm_server_port': [8000], 'vllm_server_timeout': 240.0, 'vllm_group_port': 51216, 'vllm_gpu_memory_utilization': 0.9, 'vllm_max_model_length': None, 'vllm_tensor_parallel_size': 1, 'beta': 0.04, 'num_iterations': 2, 'epsilon': 0.2, 'delta': None, 'epsilon_high': 0.28, 'sapo_temperature_neg': 1.05, 'sapo_temperature_pos': 1.0, 'importance_sampling_level': 'token', 'reward_weights': None, 'multi_objective_aggregation': 'sum_then_normalize', 'scale_rewards': 'group', 'loss_type': 'dapo', 'mask_truncated_completions': False, 'sync_ref_model': 
False, 'ref_model_mixup_alpha': 0.6, 'ref_model_sync_steps': 512, 'top_entropy_quantile': 1.0, 'max_tool_calling_iterations': None, 'vllm_importance_sampling_correction': True, 'vllm_importance_sampling_mode': 'sequence_mask', 'vllm_importance_sampling_cap': 3.0, 'off_policy_mask_threshold': None, 'use_bias_correction_kl': False, 'log_completions': True, 'num_completions_to_print': None, 'log_unique_prompts': False, 'log_completions_hub_repo': None, 'tuner_backend': 'peft', 'vit_gradient_checkpointing': True, 'router_aux_loss_coef': 0.0, 'enable_dft_loss': False, 'enable_channel_loss': False, 'safe_serialization': True, 'max_shard_size': '5GB', 'check_model': True, 'acc_strategy': 'token', 'train_dataloader_shuffle': True, 'max_epochs': None, 'aligner_lr': None, 'vit_lr': None, 'use_logits_to_keep': None, 'resume_only_model': False, 'optimizer': None, 'eval_metric': None, 'callbacks': [], 'early_stop_interval': None, 'eval_use_evalscope': False, 'eval_dataset': [], 'eval_dataset_args': None, 'eval_limit': None, 'eval_generation_config': None, 'extra_eval_args': None, 'tuner_type': 'lora', 'use_galore': False, 'galore_target_modules': None, 'galore_rank': 128, 'galore_update_proj_gap': 50, 'galore_scale': 1.0, 'galore_proj_type': 'std', 'galore_optim_per_parameter': False, 'galore_with_embedding': False, 'galore_quantization': False, 'galore_proj_quant': False, 'galore_proj_bits': 4, 'galore_proj_group_size': 256, 'galore_cos_threshold': 0.4, 'galore_gamma_proj': 2, 'galore_queue_size': 5, 'lisa_activated_layers': 0, 'lisa_step_interval': 20, 'use_flash_ckpt': False, 'vllm_pipeline_parallel_size': 1, 'vllm_enable_expert_parallel': False, 'vllm_max_num_seqs': None, 'vllm_max_model_len': None, 'vllm_disable_custom_all_reduce': True, 'vllm_enforce_eager': False, 'vllm_limit_mm_per_prompt': None, 'vllm_max_lora_rank': 16, 'vllm_enable_prefix_caching': True, 'vllm_use_async_engine': None, 'vllm_quantization': None, 'vllm_reasoning_parser': None, 
'vllm_disable_cascade_attn': False, 'vllm_mm_processor_cache_gb': None, 'vllm_speculative_config': None, 'vllm_engine_kwargs': {}, 'vllm_data_parallel_size': 1, 'stop_words': [], 'vllm_enable_lora': False, 'lora_rank': 8, 'vllm_server_group_port': None, 'enable_flattened_weight_sync': True, 'async_generate': False, 'structured_outputs_regex': None, 'sleep_level': 0, 'move_model_batches': None, 'offload_optimizer': False, 'offload_model': False, 'wandb_log_unique_prompts': None, 'cosine_min_len_value_wrong': -0.5, 'cosine_max_len_value_wrong': 0.0, 'cosine_min_len_value_correct': 1.0, 'cosine_max_len_value_correct': 0.5, 'cosine_max_len': 256, 'repetition_n_grams': 3, 'repetition_max_penalty': -1.0, 'reward_model': None, 'reward_model_plugin': None, 'chord_sft_dataset': [], 'chord_sft_per_device_train_batch_size': None, 'chord_enable_phi_function': False, 'chord_mu_warmup_steps': None, 'chord_mu_decay_steps': None, 'chord_mu_peak': None, 'chord_mu_valley': None, 'multi_turn_scheduler': None, 'max_turns': None, 'completion_length_limit_scope': 'per_round', 'vllm_server_pass_dataset': False, 'dynamic_sample': True, 'max_resample_times': 4, 'overlong_filter': True, 'soft_max_length': None, 'soft_cache_length': None, 'log_entropy': False, 'tau_pos': 1.0, 'tau_neg': 1.05, 'advantage_estimator': 'grpo', 'kl_in_reward': False, 'dataset_shuffle': True, 'rollout_importance_sampling_mode': None, 'rollout_importance_sampling_threshold': 2.0, 'log_rollout_offpolicy_metrics': False, 'off_policy_sequence_mask_delta': None}
|
| 23 |
+
2026-04-18 17:28:50,239 INFO MainThread:10295 [wandb_config.py:__setitem__():154] [no run ID] config set model/num_parameters = 2050307712 - <bound method Run._config_callback of <wandb.sdk.wandb_run.Run object at 0x7f7e494768f0>>
|
| 24 |
+
2026-04-18 17:28:50,239 INFO MainThread:10295 [wandb_run.py:_config_callback():1385] config_cb model/num_parameters 2050307712 None
|
| 25 |
+
2026-04-20 16:05:30,791 INFO wandb-AsyncioManager-main:10295 [service_client.py:_forward_responses():80] Reached EOF.
|
| 26 |
+
2026-04-20 16:05:30,792 INFO wandb-AsyncioManager-main:10295 [mailbox.py:close():137] Closing mailbox, abandoning 1 handles.
|