Prummn committed on
Commit
03cb542
·
verified ·
1 Parent(s): db9b22e

Add files using upload-large-folder tool

Browse files
Files changed (50) hide show
  1. 0417_reward.py +500 -0
  2. 0417train.sh +75 -0
  3. wandb/debug-internal.log +72 -0
  4. wandb/debug.log +26 -0
  5. wandb/run-20260417_122253-6ntp64iz/files/output.log +0 -0
  6. wandb/run-20260417_122253-6ntp64iz/files/requirements.txt +255 -0
  7. wandb/run-20260417_122253-6ntp64iz/files/wandb-metadata.json +223 -0
  8. wandb/run-20260417_122253-6ntp64iz/files/wandb-summary.json +1 -0
  9. wandb/run-20260417_122253-6ntp64iz/logs/debug-core.log +12 -0
  10. wandb/run-20260417_122253-6ntp64iz/logs/debug-internal.log +7 -0
  11. wandb/run-20260417_122253-6ntp64iz/logs/debug.log +26 -0
  12. wandb/run-20260417_123237-3h84yfea/files/config.yaml +1272 -0
  13. wandb/run-20260417_123237-3h84yfea/files/media/table/completions_1_e5129c1db5b8522d8aa7.table.json +1 -0
  14. wandb/run-20260417_123237-3h84yfea/files/media/table/completions_3_0656117578a4523e0161.table.json +1 -0
  15. wandb/run-20260417_123237-3h84yfea/files/media/table/completions_5_f2bf6a8e887194296a09.table.json +1 -0
  16. wandb/run-20260417_123237-3h84yfea/files/media/table/completions_7_4930391b310cfe338705.table.json +1 -0
  17. wandb/run-20260417_123237-3h84yfea/files/media/table/completions_9_ec21142175e3781c9ddd.table.json +1 -0
  18. wandb/run-20260417_123237-3h84yfea/files/output.log +326 -0
  19. wandb/run-20260417_123237-3h84yfea/files/requirements.txt +255 -0
  20. wandb/run-20260417_123237-3h84yfea/files/wandb-metadata.json +223 -0
  21. wandb/run-20260417_123237-3h84yfea/files/wandb-summary.json +1 -0
  22. wandb/run-20260417_123237-3h84yfea/logs/debug-core.log +14 -0
  23. wandb/run-20260417_123237-3h84yfea/logs/debug-internal.log +14 -0
  24. wandb/run-20260417_123237-3h84yfea/logs/debug.log +26 -0
  25. wandb/run-20260417_125349-3c0s7mq3/files/config.yaml +1273 -0
  26. wandb/run-20260417_125349-3c0s7mq3/files/media/table/completions_1_1de95d5626025fdbb34e.table.json +1 -0
  27. wandb/run-20260417_125349-3c0s7mq3/files/media/table/completions_3_b8120af2e2a4bc038eb5.table.json +1 -0
  28. wandb/run-20260417_125349-3c0s7mq3/files/media/table/completions_5_510c5f07b145276e4210.table.json +1 -0
  29. wandb/run-20260417_125349-3c0s7mq3/files/output.log +76 -0
  30. wandb/run-20260417_125349-3c0s7mq3/files/requirements.txt +255 -0
  31. wandb/run-20260417_125349-3c0s7mq3/files/wandb-metadata.json +224 -0
  32. wandb/run-20260417_125349-3c0s7mq3/files/wandb-summary.json +1 -0
  33. wandb/run-20260417_125349-3c0s7mq3/logs/debug-core.log +11 -0
  34. wandb/run-20260417_125349-3c0s7mq3/logs/debug-internal.log +11 -0
  35. wandb/run-20260417_125349-3c0s7mq3/logs/debug.log +26 -0
  36. wandb/run-20260418_172847-c2a5hfz3/files/config.yaml +1262 -0
  37. wandb/run-20260418_172847-c2a5hfz3/files/media/table/completions_291_2ce0194cf48cadccd2a9.table.json +1 -0
  38. wandb/run-20260418_172847-c2a5hfz3/files/media/table/completions_297_2c3b42b29065c75ff192.table.json +1 -0
  39. wandb/run-20260418_172847-c2a5hfz3/files/media/table/completions_325_dedd0bb2cd2d27e14a92.table.json +1 -0
  40. wandb/run-20260418_172847-c2a5hfz3/files/media/table/completions_331_10c4aed0f625c56bd04d.table.json +1 -0
  41. wandb/run-20260418_172847-c2a5hfz3/files/media/table/completions_335_3461640c297d6819a123.table.json +1 -0
  42. wandb/run-20260418_172847-c2a5hfz3/files/media/table/completions_411_885808c4b4bd708583eb.table.json +1 -0
  43. wandb/run-20260418_172847-c2a5hfz3/files/media/table/completions_43_9ca1008a424f8bb91c1c.table.json +1 -0
  44. wandb/run-20260418_172847-c2a5hfz3/files/media/table/completions_63_9c15897616f0ff0b68b9.table.json +1 -0
  45. wandb/run-20260418_172847-c2a5hfz3/files/output.log +0 -0
  46. wandb/run-20260418_172847-c2a5hfz3/files/requirements.txt +255 -0
  47. wandb/run-20260418_172847-c2a5hfz3/files/wandb-metadata.json +213 -0
  48. wandb/run-20260418_172847-c2a5hfz3/files/wandb-summary.json +1 -0
  49. wandb/run-20260418_172847-c2a5hfz3/logs/debug-internal.log +72 -0
  50. wandb/run-20260418_172847-c2a5hfz3/logs/debug.log +26 -0
0417_reward.py ADDED
@@ -0,0 +1,500 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # asr_RL_reward_v56_dirty.py
2
+ # -*- coding: utf-8 -*-
3
+
4
+ import re
5
+ import json
6
+ import os
7
+ import time
8
+ from functools import lru_cache
9
+ from collections import Counter
10
+ from typing import Any, Dict, List, Tuple
11
+
12
+ try:
13
+ from swift.rewards import ORM, orms
14
+ except Exception:
15
+ from swift.plugin import ORM, orms
16
+
17
+ from qwen_asr.inference.utils import parse_asr_output
18
+
19
+ _ANSWER_RE = re.compile(r"<answer>(.*?)</answer>", re.S | re.I)
20
+ _REWARD_DEBUG_COUNTER: Dict[str, int] = {}
21
+
22
+
23
+ def _as_bool(x, default: bool = False) -> bool:
24
+ if x is None:
25
+ return default
26
+ if isinstance(x, bool):
27
+ return x
28
+ if isinstance(x, (int, float)):
29
+ return bool(x)
30
+ return str(x).strip().lower() in {"1", "true", "yes", "y", "on"}
31
+
32
+
33
+ def _to_jsonable(x: Any):
34
+ if x is None or isinstance(x, (str, int, float, bool)):
35
+ return x
36
+ if isinstance(x, (list, tuple)):
37
+ return [_to_jsonable(v) for v in x]
38
+ if isinstance(x, dict):
39
+ return {str(k): _to_jsonable(v) for k, v in x.items()}
40
+ return str(x)
41
+
42
+
43
+ def _pick_field(x, i: int):
44
+ if x is None:
45
+ return None
46
+ if isinstance(x, (list, tuple)):
47
+ return x[i] if i < len(x) else None
48
+ return x
49
+
50
+
51
def _reward_debug_enabled(kwargs) -> bool:
    """Tell whether reward debug logging is switched on.

    A ``reward_debug`` entry in *kwargs* takes precedence (even when its
    value is ``None``); otherwise the ``ASR_REWARD_DEBUG`` environment
    variable decides. Missing or unparsable values count as disabled.
    """
    if "reward_debug" in kwargs:
        flag = kwargs.get("reward_debug")
    else:
        flag = os.environ.get("ASR_REWARD_DEBUG")
    return _as_bool(flag, default=False)
55
+
56
+
57
+ def _reward_debug_path(kwargs, reward_name: str) -> str:
58
+ base = kwargs.get("reward_debug_path") or os.environ.get("ASR_REWARD_DEBUG_PATH")
59
+ if not base:
60
+ return ""
61
+ base = str(base)
62
+ if base.endswith(".jsonl"):
63
+ base = base[:-6]
64
+ return f"{base}.{reward_name}.pid{os.getpid()}.jsonl"
65
+
66
+
67
+ def _reward_debug_max_rows(kwargs) -> int:
68
+ x = kwargs.get("reward_debug_max_rows")
69
+ if x is None:
70
+ x = os.environ.get("ASR_REWARD_DEBUG_MAX_ROWS", 1000)
71
+ try:
72
+ x = int(x)
73
+ except Exception:
74
+ x = 1000
75
+ return max(0, x)
76
+
77
+
78
def _collect_common_debug_meta(kwargs, i: int) -> Dict[str, Any]:
    """Gather the known metadata fields for sample *i* from *kwargs*.

    Only keys actually present in *kwargs* are included. Each value is
    narrowed to the *i*-th sample via ``_pick_field`` and made JSON-safe
    via ``_to_jsonable``.
    """
    wanted = (
        "step", "id", "sample_id", "group_id", "utt_id", "audio_id", "audio_path",
        "task", "lang", "language", "base_wer", "base_wer_bucket", "difficulty_bucket", "wer",
        "dirty_type",
    )
    return {
        name: _to_jsonable(_pick_field(kwargs.get(name), i))
        for name in wanted
        if name in kwargs
    }
89
+
90
+
91
def _append_reward_debug_row(reward_name: str, kwargs, row: Dict[str, Any]) -> None:
    """Append one JSON line describing a scored sample to the debug file.

    Does nothing when debugging is disabled, no path is configured, the row
    cap is zero, or this process has already written the cap for that path
    (tracked in the module-level ``_REWARD_DEBUG_COUNTER``). Writing is
    best-effort: any exception is swallowed so the caller is never
    interrupted by logging problems.
    """
    if not _reward_debug_enabled(kwargs):
        return
    path = _reward_debug_path(kwargs, reward_name)
    if not path:
        return
    limit = _reward_debug_max_rows(kwargs)
    if limit <= 0:
        return
    written = _REWARD_DEBUG_COUNTER.get(path, 0)
    if written >= limit:
        return
    try:
        folder = os.path.dirname(path)
        if folder:
            os.makedirs(folder, exist_ok=True)
        # Keys coming from `row` win over the two header fields on collision.
        record = {
            "ts": time.time(),
            "reward_name": reward_name,
            **_to_jsonable(row),
        }
        with open(path, "a", encoding="utf-8") as fh:
            fh.write(json.dumps(record, ensure_ascii=False) + "\n")
        # Count only rows that were actually written.
        _REWARD_DEBUG_COUNTER[path] = written + 1
    except Exception:
        # Deliberate best-effort: debug logging must not break the caller.
        pass
117
+
118
+
119
def _extract_completion_text(s: str) -> str:
    """Reduce a raw model completion to the bare transcription text.

    Steps, in order:
      1. ``None`` becomes ``""``; otherwise surrounding whitespace is stripped.
      2. If an ``<answer>...</answer>`` span is found, only its content is kept.
      3. One leading label (e.g. ``transcription:``) is removed, matched
         case-insensitively; only the first matching label is stripped.
      4. Every ``<|im_end|>`` marker is removed.
      5. ``parse_asr_output`` is tried; a non-empty text result replaces the
         string, while any exception it raises is ignored.

    Returns:
        The cleaned hypothesis string (possibly empty).
    """
    if s is None:
        return ""
    s = s.strip()
    m = _ANSWER_RE.search(s)
    if m:
        s = m.group(1).strip()
    lower = s.lower()
    # The Chinese labels are listed with both an ASCII colon and a full-width
    # colon (U+FF1A). The full-width forms are written as escapes so that a
    # Unicode-normalising tool cannot fold them back into duplicates of the
    # ASCII entries, which would leave that spelling unhandled.
    prefixes = (
        "transcription:",
        "asr:",
        "answer:",
        "答案:",
        "答案\uff1a",
        "识别结果:",
        "识别结果\uff1a",
    )
    for pfx in prefixes:
        if lower.startswith(pfx):
            s = s[len(pfx):].strip()
            break
    s = s.replace("<|im_end|>", "").strip()
    try:
        _lang, text = parse_asr_output(s, user_language=None)
        if text:
            s = text
    except Exception:
        # Best-effort: fall back to the manually cleaned string.
        pass
    return s
139
+
140
+
141
def normalize_text(s: str) -> str:
    """Return *s* stripped and lower-cased; falsy input becomes ``""``."""
    text = s if s else ""
    return text.strip().lower()
143
+
144
+
145
@lru_cache(maxsize=50000)
def _tokenize_cached(s: str) -> Tuple[str, ...]:
    """Tokenize normalized text, memoized on the input string.

    Text containing at least one ASCII space is split on whitespace into
    word tokens; text without any is split into individual non-whitespace
    characters. Empty input yields an empty tuple.
    """
    text = normalize_text(s)
    if not text:
        return ()
    if " " not in text:
        # No ASCII space: fall back to character-level tokens.
        return tuple(ch for ch in text if not ch.isspace())
    # str.split() with no arguments never produces empty tokens.
    return tuple(text.split())
153
+
154
+
155
def _tokenize(s: str) -> List[str]:
    """Return the cached tokenization of *s* as a fresh, mutable list."""
    return [*_tokenize_cached(s)]
157
+
158
+
159
def _char_seq(s: str) -> List[str]:
    """Return the non-whitespace characters of the normalized text, in order."""
    chars: List[str] = []
    for ch in normalize_text(s):
        if ch.isspace():
            continue
        chars.append(ch)
    return chars
162
+
163
+
164
+ def _infer_dirty_type_from_audio(x: Any) -> str:
165
+ if x is None:
166
+ return "other"
167
+ if isinstance(x, (list, tuple)) and len(x) > 0:
168
+ x = x[0]
169
+ s = str(x).lower()
170
+ if "voices" in s:
171
+ return "voices_noise_plus_farfield"
172
+ if "noise+rsp" in s or "resample_noise" in s or ("/noise/" in s and "voices" not in s):
173
+ return "noise_rsp_pure_noise"
174
+ return "other"
175
+
176
+
177
def _get_dirty_type(kwargs, i: int) -> str:
    """Resolve the degradation category for sample *i*.

    An explicit ``dirty_type`` field wins: known aliases are mapped onto the
    two canonical labels and any other value is returned stripped and
    lower-cased. Without it, the category is inferred from ``audio_path``
    or, when that is missing, from ``audios``.
    """
    declared = _pick_field(kwargs.get("dirty_type"), i)
    if declared is not None:
        label = str(declared).strip().lower()
        voices_aliases = {"voices", "voices_noise_plus_farfield", "voices_far", "voices_farfield"}
        noise_aliases = {"noise", "noise_rsp", "noise_rsp_pure_noise", "pure_noise"}
        if label in voices_aliases:
            return "voices_noise_plus_farfield"
        if label in noise_aliases:
            return "noise_rsp_pure_noise"
        return label

    source = _pick_field(kwargs.get("audio_path"), i)
    if source is None:
        source = _pick_field(kwargs.get("audios"), i)
    return _infer_dirty_type_from_audio(source)
193
+
194
+
195
+ def _edit_ops_counts(ref_toks: List[str], hyp_toks: List[str]) -> Tuple[int, int, int]:
196
+ n, m = len(ref_toks), len(hyp_toks)
197
+ dp = [[0] * (m + 1) for _ in range(n + 1)]
198
+ bt = [[0] * (m + 1) for _ in range(n + 1)]
199
+
200
+ for i in range(1, n + 1):
201
+ dp[i][0] = i
202
+ bt[i][0] = 2
203
+ for j in range(1, m + 1):
204
+ dp[0][j] = j
205
+ bt[0][j] = 3
206
+
207
+ for i in range(1, n + 1):
208
+ ri = ref_toks[i - 1]
209
+ for j in range(1, m + 1):
210
+ hj = hyp_toks[j - 1]
211
+ if ri == hj:
212
+ dp[i][j] = dp[i - 1][j - 1]
213
+ bt[i][j] = 0
214
+ else:
215
+ sub = dp[i - 1][j - 1] + 1
216
+ dele = dp[i - 1][j] + 1
217
+ ins = dp[i][j - 1] + 1
218
+ best = min(sub, dele, ins)
219
+ dp[i][j] = best
220
+ if best == sub:
221
+ bt[i][j] = 1
222
+ elif best == dele:
223
+ bt[i][j] = 2
224
+ else:
225
+ bt[i][j] = 3
226
+
227
+ i, j = n, m
228
+ sub = dele = ins = 0
229
+ while i > 0 or j > 0:
230
+ op = bt[i][j]
231
+ if i > 0 and j > 0 and op == 0:
232
+ i -= 1
233
+ j -= 1
234
+ elif i > 0 and j > 0 and op == 1:
235
+ sub += 1
236
+ i -= 1
237
+ j -= 1
238
+ elif i > 0 and op == 2:
239
+ dele += 1
240
+ i -= 1
241
+ else:
242
+ ins += 1
243
+ j -= 1
244
+ return sub, dele, ins
245
+
246
+
247
def _char_bigram_f1(hyp: str, ref: str) -> float:
    """F1 overlap of character bigrams between hypothesis and reference.

    Both inputs are reduced to non-whitespace characters first. Two empty
    sequences score 1.0 and exactly one empty sequence scores 0.0. When
    either side has fewer than two characters, position-wise character
    matches are used in place of bigram counts.
    """
    hyp_chars = _char_seq(hyp)
    ref_chars = _char_seq(ref)
    if not hyp_chars and not ref_chars:
        return 1.0
    if not (hyp_chars and ref_chars):
        return 0.0

    if min(len(hyp_chars), len(ref_chars)) < 2:
        # Too short for bigrams: compare characters at equal positions.
        overlap = sum(1 for a, b in zip(hyp_chars, ref_chars) if a == b)
        hyp_total = len(hyp_chars)
        ref_total = len(ref_chars)
    else:
        hyp_grams = Counter(zip(hyp_chars, hyp_chars[1:]))
        ref_grams = Counter(zip(ref_chars, ref_chars[1:]))
        # Clipped overlap: each bigram counts at most as often as in the reference.
        overlap = sum(min(count, ref_grams[gram]) for gram, count in hyp_grams.items())
        hyp_total = sum(hyp_grams.values())
        ref_total = sum(ref_grams.values())

    precision = overlap / max(1, hyp_total)
    recall = overlap / max(1, ref_total)
    return 2.0 * precision * recall / max(1e-8, precision + recall)
266
+
267
+
268
def _lcs_lengths(hyp: str, ref: str) -> Tuple[int, int, int]:
    """Compute the character-level longest-common-subsequence length.

    Returns:
        ``(lcs_len, ref_len, hyp_len)`` where the lengths count
        non-whitespace characters. The LCS length is 0 when either side is
        empty.
    """
    hyp_chars = _char_seq(hyp)
    ref_chars = _char_seq(ref)
    ref_len, hyp_len = len(ref_chars), len(hyp_chars)
    if not ref_len or not hyp_len:
        return 0, ref_len, hyp_len

    # Rolling one-row DP: `row` is the previous reference row.
    row = [0] * (hyp_len + 1)
    for ref_ch in ref_chars:
        nxt = [0]
        for col, hyp_ch in enumerate(hyp_chars, start=1):
            if ref_ch == hyp_ch:
                nxt.append(row[col - 1] + 1)
            else:
                nxt.append(max(row[col], nxt[col - 1]))
        row = nxt
    return row[hyp_len], ref_len, hyp_len
285
+
286
+
287
def _lcs_f1(hyp: str, ref: str) -> float:
    """F1 score from the character LCS (precision over hyp, recall over ref).

    Two empty inputs score 1.0; exactly one empty input scores 0.0.
    """
    lcs_len, ref_len, hyp_len = _lcs_lengths(hyp, ref)
    if ref_len == 0 or hyp_len == 0:
        return 1.0 if ref_len == hyp_len else 0.0
    precision = lcs_len / max(1, hyp_len)
    recall = lcs_len / max(1, ref_len)
    return 2.0 * precision * recall / max(1e-8, precision + recall)
296
+
297
+
298
def _cmp_score(hyp: str, ref: str) -> float:
    """Blend character-bigram F1 (weight 0.70) and LCS F1 (weight 0.30)."""
    bigram_part = 0.70 * _char_bigram_f1(hyp, ref)
    lcs_part = 0.30 * _lcs_f1(hyp, ref)
    return bigram_part + lcs_part
300
+
301
+
302
def wer_reward_main(wer: float) -> float:
    """Map a word error rate onto the main reward with a piecewise-linear curve.

    The segments join at WER 0.15, 0.35, 0.70 and 1.20; beyond 1.20 the
    reward is the constant floor -0.92. The comparisons are kept in
    ascending order so that a value failing all of them (e.g. NaN) also
    lands on the floor.
    """
    if wer <= 0.15:
        return 1.0 - 1.8 * wer
    if wer <= 0.35:
        return 0.73 - 2.3 * (wer - 0.15)
    if wer <= 0.70:
        return 0.27 - 2.4 * (wer - 0.35)
    if wer <= 1.20:
        return -0.57 - 0.70 * (wer - 0.70)
    return -0.92
313
+
314
+
315
def length_ratio_penalty_v3(
    hyp_len: int,
    ref_len: int,
    soft_min: float = 0.90,
    soft_max: float = 1.10,
    hard_min: float = 0.78,
    hard_max: float = 1.30,
    soft_penalty: float = 0.10,
    hard_penalty: float = 0.36,
) -> float:
    """Penalize hypotheses whose length deviates from the reference length.

    The ratio ``hyp_len / max(1, ref_len)`` is scored in three zones:
      * inside ``[soft_min, soft_max]``: no penalty;
      * between the soft and hard bounds: linear ramp from 0 down to
        ``-soft_penalty``;
      * beyond a hard bound: ramp from ``-soft_penalty`` towards
        ``-hard_penalty``, saturating once the overshoot relative to the
        bound reaches 1.

    Returns:
        A value in ``[-hard_penalty, 0.0]`` for the default parameters.
    """
    ratio = hyp_len / max(1, ref_len)

    if soft_min <= ratio <= soft_max:
        return 0.0
    if hard_min <= ratio < soft_min:
        ramp = (soft_min - ratio) / max(1e-6, soft_min - hard_min)
        return -soft_penalty * ramp
    if soft_max < ratio <= hard_max:
        ramp = (ratio - soft_max) / max(1e-6, hard_max - soft_max)
        return -soft_penalty * ramp

    # Outside the hard bounds: measure the overshoot relative to the bound.
    if ratio < hard_min:
        overshoot = (hard_min - ratio) / max(1e-6, hard_min)
    else:
        overshoot = (ratio - hard_max) / max(1e-6, hard_max)
    frac = min(1.0, overshoot)
    return -(soft_penalty + (hard_penalty - soft_penalty) * frac)
340
+
341
+
342
def tail_penalty(len_ratio: float) -> float:
    """Extra penalty for hypotheses that run longer than the reference.

    No penalty up to a ratio of 1.15, then a linear ramp to -0.28 at 1.40,
    a second ramp to -0.70 at 2.0, and a constant -0.70 beyond that.
    """
    if len_ratio <= 1.15:
        return 0.0
    if len_ratio <= 1.40:
        first_ramp = (len_ratio - 1.15) / 0.25
        return -0.28 * first_ramp
    if len_ratio <= 2.0:
        return -0.28 - 0.42 * (len_ratio - 1.40) / 0.60
    return -0.70
350
+
351
+
352
def is_hallucination_v56(hyp_toks: List[str], ref_toks: List[str], wer: float, len_ratio: float):
    """Heuristically flag a hypothesis as empty, looping or runaway output.

    Checks run in this order and the first hit wins:
      1. empty hypothesis;
      2. the same token five or more times in a row;
      3. for hypotheses of at least 8 tokens, the most frequent bigram
         making up more than 22% of all bigrams;
      4. hypothesis/reference length ratio above 1.60;
      5. WER of at least 1.20.

    *ref_toks* is accepted for signature compatibility but not inspected.

    Returns:
        ``(flagged, reason)``; the reason is ``"ok"`` when nothing fired.
    """
    if len(hyp_toks) == 0:
        return True, "empty"

    streak = 1
    for prev_tok, tok in zip(hyp_toks, hyp_toks[1:]):
        streak = streak + 1 if tok == prev_tok else 1
        if streak >= 5:
            return True, "repeat_run>=5"

    if len(hyp_toks) >= 8:
        pairs = list(zip(hyp_toks, hyp_toks[1:]))
        top_count = max(Counter(pairs).values())
        # NOTE(review): with 8-10 tokens a bigram occurring just twice
        # already exceeds the threshold (2/7, 2/8 and 2/9 are all > 0.22).
        if top_count / max(1, len(pairs)) > 0.22:
            return True, "repeat_bigram>0.22"

    if len_ratio > 1.60:
        return True, "len_ratio>1.60"
    if wer >= 1.20:
        return True, "wer>=1.20"
    return False, "ok"
376
+
377
+
378
+ def _voices_residual(del_rate: float, len_ratio: float):
379
+ p_del_voice = -0.12 * del_rate - 0.08 * max(0.0, del_rate - 0.10)
380
+ p_under_voice = -0.06 * max(0.0, 0.98 - len_ratio)
381
+ return p_del_voice, p_under_voice
382
+
383
+
384
+ def _noise_residual(sub_rate: float, cmp_score: float):
385
+ p_sub_noise = -0.08 * sub_rate
386
+ p_cmp_noise = -0.04 * (1.0 - cmp_score)
387
+ return p_sub_noise, p_cmp_noise
388
+
389
+
390
class ASRWerSubLenCmpHalluDirtyV56(ORM):
    """Reward for ASR completions built from WER plus several penalties.

    For each completion/reference pair the reward is the sum of a
    piecewise-linear WER reward and penalties for substitutions, length
    mismatch, over-long tails, low character-level similarity,
    hallucination heuristics and empty output, plus category-specific
    residuals selected by the resolved "dirty type". The sum is clipped to
    ``[reward_clip_min, reward_clip_max]``.
    """

    # Substitution penalty: base slope, and extra slope above a 0.35 rate.
    sub_penalty_a = 0.40
    sub_penalty_b = 0.35
    # Weight of the (1 - similarity score) penalty.
    cmp_penalty = 0.14
    # Flat penalties for flagged hallucinations and for empty hypotheses.
    hallu_extra_penalty = 0.42
    empty_extra_penalty = 0.28

    # Bounds applied to the summed reward.
    reward_clip_min = -4.0
    reward_clip_max = 2.0

    def __call__(self, completions, solution=None, **kwargs):
        """Score every completion against its reference transcription.

        Args:
            completions: Raw model outputs, one per sample.
            solution: A single reference string shared by all completions,
                or an iterable of per-sample references. Falls back to
                ``kwargs["solution"]`` when ``None``.
            **kwargs: Optional per-sample metadata and debug switches
                (e.g. ``dirty_type``, ``audio_path``, ``reward_debug``).

        Returns:
            A list of clipped float rewards. All zeros when no reference is
            available; pairs are formed with ``zip``, so the result is as
            long as the shorter of completions and references.
        """
        if solution is None:
            solution = kwargs.get("solution")
        if solution is None:
            return [0.0 for _ in completions]

        if isinstance(solution, str):
            references = [solution for _ in completions]
        else:
            references = list(solution)

        clip_lo = float(self.reward_clip_min)
        clip_hi = float(self.reward_clip_max)

        rewards = []
        for idx, (completion, reference) in enumerate(zip(completions, references)):
            hyp = _extract_completion_text(completion)
            ref = reference or ""

            ref_toks = _tokenize(ref)
            hyp_toks = _tokenize(hyp)

            # An empty reference is treated as length 1 to keep rates finite.
            ref_len = max(1, len(ref_toks))
            hyp_len = len(hyp_toks)
            len_ratio = float(hyp_len) / float(ref_len)

            sub_cnt, del_cnt, ins_cnt = _edit_ops_counts(ref_toks, hyp_toks)
            wer = float(sub_cnt + del_cnt + ins_cnt) / float(ref_len)
            sub_rate = float(sub_cnt) / float(ref_len)
            del_rate = float(del_cnt) / float(ref_len)

            # Category-independent terms.
            r_wer = wer_reward_main(wer)
            p_sub = -float(self.sub_penalty_a) * sub_rate - float(self.sub_penalty_b) * max(0.0, sub_rate - 0.35)
            p_len = length_ratio_penalty_v3(hyp_len=hyp_len, ref_len=ref_len)
            p_tail = tail_penalty(len_ratio)

            cmp_score = _cmp_score(hyp, ref)
            p_cmp = -float(self.cmp_penalty) * (1.0 - cmp_score)

            hallu, hallu_reason = is_hallucination_v56(hyp_toks, ref_toks, wer, len_ratio)
            p_hallu = 0.0
            if hallu:
                p_hallu = -float(self.hallu_extra_penalty)
            p_empty = 0.0
            if hyp_len == 0:
                p_empty = -float(self.empty_extra_penalty)

            # Category-specific residuals; unknown categories add nothing.
            dirty_type = _get_dirty_type(kwargs, idx)
            p_del_voice = p_under_voice = p_sub_noise = p_cmp_noise = 0.0
            if dirty_type == "voices_noise_plus_farfield":
                p_del_voice, p_under_voice = _voices_residual(del_rate, len_ratio)
            elif dirty_type == "noise_rsp_pure_noise":
                p_sub_noise, p_cmp_noise = _noise_residual(sub_rate, cmp_score)

            reward_raw = float(
                r_wer + p_sub + p_len + p_tail + p_cmp + p_hallu + p_empty
                + p_del_voice + p_under_voice + p_sub_noise + p_cmp_noise
            )
            reward = max(clip_lo, min(clip_hi, reward_raw))
            rewards.append(reward)

            # Optional per-sample trace; a no-op unless debugging is enabled.
            debug_row = dict(_collect_common_debug_meta(kwargs, idx))
            debug_row.update({
                "index": idx,
                "dirty_type_resolved": dirty_type,
                "completion_raw": completion,
                "hyp": hyp,
                "ref": ref,
                "ref_len": ref_len,
                "hyp_len": hyp_len,
                "len_ratio": len_ratio,
                "sub_cnt": sub_cnt,
                "del_cnt": del_cnt,
                "ins_cnt": ins_cnt,
                "wer_calc": wer,
                "sub_rate": sub_rate,
                "del_rate": del_rate,
                "cmp_score": cmp_score,
                "hallu": hallu,
                "hallu_reason": hallu_reason,
                "r_wer": r_wer,
                "p_sub": p_sub,
                "p_len": p_len,
                "p_tail": p_tail,
                "p_cmp": p_cmp,
                "p_hallu": p_hallu,
                "p_empty": p_empty,
                "p_del_voice": p_del_voice,
                "p_under_voice": p_under_voice,
                "p_sub_noise": p_sub_noise,
                "p_cmp_noise": p_cmp_noise,
                "reward_raw": reward_raw,
                "reward": reward,
            })
            _append_reward_debug_row(
                reward_name="asr_wer_sub_len_cmp_hallu_dirty_v56",
                kwargs=kwargs,
                row=debug_row,
            )

        return rewards
498
+
499
+
500
+ orms["asr_wer_sub_len_cmp_hallu_dirty_v56"] = ASRWerSubLenCmpHalluDirtyV56
0417train.sh ADDED
@@ -0,0 +1,75 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
# Launches `swift rlhf` (GRPO trainer, DAPO loss, LoRA) for the Qwen3-ASR
# model with the custom reward `asr_wer_sub_len_cmp_hallu_dirty_v56`.

# Shared path prefixes, factored out so each location is spelled once.
WORK_DIR="/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin"
UPLOAD_DIR="${WORK_DIR}/0416upload"
RUN_NAME="qwen3asr_dapo_reward56_4x4x12_12gen_4GPU"
OUTPUT_DIR="${UPLOAD_DIR}/out/${RUN_NAME}"

TRAIN_DATA="${UPLOAD_DIR}/lora_0323_10w+55w+error+syn_with_domain_train90_targeted_rl_train90_loramerged_basewer_3suppress_server.jsonl"
VAL_DATA="${UPLOAD_DIR}/lora_0323_10w+55w+error+syn_with_domain_train90_targeted_rl_val5_sample5p_server.jsonl"  # newly added validation set

export MASTER_PORT=29540
export MASTER_ADDR=127.0.0.1

######################
# 0. Base environment variables (wandb)
######################
export WANDB_BASE_URL="https://api.wandb.ai"
# SECURITY: the API key must be supplied by the caller's environment (or by a
# prior `wandb login`) and must never be committed.
# NOTE(review): an earlier revision of this script hard-coded a key that was
# published with the commit; treat that key as compromised and rotate it.
if [ -n "${WANDB_API_KEY:-}" ]; then
  export WANDB_API_KEY
else
  echo "WANDB_API_KEY is not set; relying on credentials stored by 'wandb login'." >&2
fi
export WANDB_PROJECT="qwen3_asr_swift_dapo"   # project name as shown in the W&B UI
export WANDB_ENTITY="pang_kaiyu-none"         # entity as shown in the W&B UI

# W&B logging mode and distributed-launch settings.
export WANDB_MODE=online
export NPROC_PER_NODE=4
export SWIFT_SINGLE_DEVICE_MODE=1
export PYTORCH_CUDA_ALLOC_CONF=expandable_segments:True

# Per-sample reward debug dump, read by the reward plugin (0417_reward.py).
export ASR_REWARD_DEBUG=1
export ASR_REWARD_DEBUG_PATH="${OUTPUT_DIR}/reward_debug"
export ASR_REWARD_DEBUG_MAX_ROWS=1000

swift rlhf \
  --rlhf_type grpo \
  --external_plugins "${UPLOAD_DIR}/my_qwen3_asr_dapo_register.py" "${UPLOAD_DIR}/0417_reward.py" \
  --model "${WORK_DIR}/qwen3-asr-merged" \
  --model_type my_qwen3_asr_rl \
  --template my_qwen3_asr_rl \
  --dataset "${TRAIN_DATA}" \
  --val_dataset "${VAL_DATA}" \
  --reward_funcs asr_wer_sub_len_cmp_hallu_dirty_v56 \
  --train_type lora \
  --use_vllm false \
  --log_completions true \
  --loss_type dapo \
  --advantage_estimator grpo \
  --scale_rewards group \
  --num_iterations 2 \
  --beta 0.04 \
  --epsilon_high 0.28 \
  --dynamic_sample true \
  --max_resample_times 4 \
  --overlong_filter true \
  --truncation_strategy delete \
  --num_generations 12 \
  --generation_batch_size 48 \
  --per_device_train_batch_size 4 \
  --per_device_eval_batch_size 4 \
  --gradient_accumulation_steps 12 \
  --num_generations_eval 4 \
  --max_completion_length 256 \
  --temperature 0.50 \
  --top_p 0.95 \
  --top_k 50 \
  --repetition_penalty 1.08 \
  --learning_rate 5e-5 \
  --lr_scheduler_type cosine \
  --warmup_ratio 0.03 \
  --report_to wandb \
  --run_name "${RUN_NAME}" \
  --output_dir "${OUTPUT_DIR}" \
  --save_strategy steps \
  --save_steps 20 \
  --logging_steps 5 \
  --freeze_llm false \
  --freeze_vit false \
  --freeze_aligner false \
  --remove_unused_columns false \
  --padding_side left
wandb/debug-internal.log ADDED
@@ -0,0 +1,72 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"time":"2026-04-18T17:28:47.877484976+08:00","level":"INFO","msg":"stream: starting","core version":"0.23.0"}
2
+ {"time":"2026-04-18T17:28:48.347618035+08:00","level":"INFO","msg":"stream: created new stream","id":"c2a5hfz3"}
3
+ {"time":"2026-04-18T17:28:48.347701352+08:00","level":"INFO","msg":"handler: started","stream_id":"c2a5hfz3"}
4
+ {"time":"2026-04-18T17:28:48.350844585+08:00","level":"INFO","msg":"stream: started","id":"c2a5hfz3"}
5
+ {"time":"2026-04-18T17:28:48.350849894+08:00","level":"INFO","msg":"writer: started","stream_id":"c2a5hfz3"}
6
+ {"time":"2026-04-18T17:28:48.350854798+08:00","level":"INFO","msg":"sender: started","stream_id":"c2a5hfz3"}
7
+ {"time":"2026-04-18T17:37:33.858258418+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
8
+ {"time":"2026-04-19T02:34:07.470718868+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
9
+ {"time":"2026-04-19T02:38:39.32386773+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": http2: client conn could not be established"}
10
+ {"time":"2026-04-19T02:40:17.658933776+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
11
+ {"time":"2026-04-19T02:43:03.564180775+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
12
+ {"time":"2026-04-19T02:44:49.518795314+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
13
+ {"time":"2026-04-19T02:45:08.529740538+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
14
+ {"time":"2026-04-19T02:46:20.848321936+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
15
+ {"time":"2026-04-19T02:49:05.639172159+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
16
+ {"time":"2026-04-19T15:09:49.426045163+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
17
+ {"time":"2026-04-19T15:57:04.347389276+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
18
+ {"time":"2026-04-19T16:02:30.488210102+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
19
+ {"time":"2026-04-19T22:07:33.03303113+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
20
+ {"time":"2026-04-19T22:07:51.98901393+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
21
+ {"time":"2026-04-19T22:08:16.035247515+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
22
+ {"time":"2026-04-19T22:09:42.186767689+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
23
+ {"time":"2026-04-19T22:24:00.480169619+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
24
+ {"time":"2026-04-19T22:24:34.690158146+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
25
+ {"time":"2026-04-19T22:28:36.622066809+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
26
+ {"time":"2026-04-19T22:28:59.75540152+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
27
+ {"time":"2026-04-19T22:31:22.975036457+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
28
+ {"time":"2026-04-19T22:34:17.890202383+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
29
+ {"time":"2026-04-19T22:43:21.155119859+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
30
+ {"time":"2026-04-19T22:43:38.33530735+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
31
+ {"time":"2026-04-19T22:46:03.44895843+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
32
+ {"time":"2026-04-19T22:48:50.248056745+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
33
+ {"time":"2026-04-19T22:49:48.447601198+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
34
+ {"time":"2026-04-19T22:52:35.56119014+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
35
+ {"time":"2026-04-19T22:52:50.371922946+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
36
+ {"time":"2026-04-19T22:56:30.747794336+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
37
+ {"time":"2026-04-19T22:58:32.547706574+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
38
+ {"time":"2026-04-19T23:00:23.617563694+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
39
+ {"time":"2026-04-19T23:00:37.717734501+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
40
+ {"time":"2026-04-19T23:05:31.94573349+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
41
+ {"time":"2026-04-19T23:05:44.893259249+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
42
+ {"time":"2026-04-20T00:03:04.382543732+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
43
+ {"time":"2026-04-20T00:03:19.501053157+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
44
+ {"time":"2026-04-20T00:05:31.556601347+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
45
+ {"time":"2026-04-20T00:06:03.495128433+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
46
+ {"time":"2026-04-20T00:11:23.73287074+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
47
+ {"time":"2026-04-20T02:58:43.522847172+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": net/http: request canceled (Client.Timeout exceeded while awaiting headers)"}
48
+ {"time":"2026-04-20T02:59:04.598457045+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": context deadline exceeded"}
49
+ {"time":"2026-04-20T02:59:15.733502761+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": context deadline exceeded (Client.Timeout exceeded while awaiting headers)"}
50
+ {"time":"2026-04-20T02:59:49.917399553+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": context deadline exceeded (Client.Timeout exceeded while awaiting headers)"}
51
+ {"time":"2026-04-20T03:00:07.058218433+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": context deadline exceeded"}
52
+ {"time":"2026-04-20T03:00:29.606621937+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": net/http: request canceled (Client.Timeout exceeded while awaiting headers)"}
53
+ {"time":"2026-04-20T03:00:34.624296643+08:00","level":"INFO","msg":"flowcontrol: backed up, offloading to disk","recordNumber":124381}
54
+ {"time":"2026-04-20T03:00:46.264621657+08:00","level":"INFO","msg":"flowcontrol: unblocked","totalOffloaded":1}
55
+ {"time":"2026-04-20T03:44:43.734398398+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": context deadline exceeded (Client.Timeout exceeded while awaiting headers)"}
56
+ {"time":"2026-04-20T04:11:48.762158534+08:00","level":"INFO","msg":"api: retrying HTTP error","status":503,"url":"https://api.wandb.ai/graphql","body":"upstream connect error or disconnect/reset before headers. reset reason: connection termination"}
57
+ {"time":"2026-04-20T04:13:58.74920069+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": net/http: request canceled (Client.Timeout exceeded while awaiting headers)"}
58
+ {"time":"2026-04-20T06:34:34.21211755+08:00","level":"INFO","msg":"api: retrying HTTP error","status":503,"url":"https://api.wandb.ai/graphql","body":"upstream connect error or disconnect/reset before headers. reset reason: connection termination"}
59
+ {"time":"2026-04-20T10:50:53.628901466+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
60
+ {"time":"2026-04-20T16:00:42.158363018+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
61
+ {"time":"2026-04-20T16:02:08.101875007+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
62
+ {"time":"2026-04-20T16:03:45.141714956+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
63
+ {"time":"2026-04-20T16:04:52.17332644+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
64
+ {"time":"2026-04-20T16:05:06.320377956+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
65
+ {"time":"2026-04-20T16:05:29.800728083+08:00","level":"ERROR","msg":"sender: sendStopStatus: failed to get run stopped status: context deadline exceeded (Client.Timeout or context cancellation while reading body)"}
66
+ {"time":"2026-04-20T16:05:30.799799131+08:00","level":"INFO","msg":"stream: closing","id":"c2a5hfz3"}
67
+ {"time":"2026-04-20T16:05:39.191906442+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
68
+ {"time":"2026-04-20T16:05:43.710909983+08:00","level":"INFO","msg":"fileTransfer: Close: file transfer manager closed"}
69
+ {"time":"2026-04-20T16:06:10.469686843+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
70
+ {"time":"2026-04-20T16:06:17.397266507+08:00","level":"INFO","msg":"handler: closed","stream_id":"c2a5hfz3"}
71
+ {"time":"2026-04-20T16:06:17.400263519+08:00","level":"INFO","msg":"sender: closed","stream_id":"c2a5hfz3"}
72
+ {"time":"2026-04-20T16:06:17.40028542+08:00","level":"INFO","msg":"stream: closed","id":"c2a5hfz3"}
wandb/debug.log ADDED
@@ -0,0 +1,26 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2026-04-18 17:28:47,491 INFO MainThread:10295 [wandb_setup.py:_flush():80] Current SDK version is 0.23.0
2
+ 2026-04-18 17:28:47,491 INFO MainThread:10295 [wandb_setup.py:_flush():80] Configure stats pid to 10295
3
+ 2026-04-18 17:28:47,491 INFO MainThread:10295 [wandb_setup.py:_flush():80] Loading settings from /mnt/petrelfs/panjiabao/.config/wandb/settings
4
+ 2026-04-18 17:28:47,491 INFO MainThread:10295 [wandb_setup.py:_flush():80] Loading settings from /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/wandb/settings
5
+ 2026-04-18 17:28:47,491 INFO MainThread:10295 [wandb_setup.py:_flush():80] Loading settings from environment variables
6
+ 2026-04-18 17:28:47,491 INFO MainThread:10295 [wandb_init.py:setup_run_log_directory():713] Logging user logs to /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/wandb/run-20260418_172847-c2a5hfz3/logs/debug.log
7
+ 2026-04-18 17:28:47,491 INFO MainThread:10295 [wandb_init.py:setup_run_log_directory():714] Logging internal logs to /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/wandb/run-20260418_172847-c2a5hfz3/logs/debug-internal.log
8
+ 2026-04-18 17:28:47,491 INFO MainThread:10295 [wandb_init.py:init():840] calling init triggers
9
+ 2026-04-18 17:28:47,491 INFO MainThread:10295 [wandb_init.py:init():845] wandb.init called with sweep_config: {}
10
+ config: {'_wandb': {}}
11
+ 2026-04-18 17:28:47,491 INFO MainThread:10295 [wandb_init.py:init():888] starting backend
12
+ 2026-04-18 17:28:47,865 INFO MainThread:10295 [wandb_init.py:init():891] sending inform_init request
13
+ 2026-04-18 17:28:47,870 INFO MainThread:10295 [wandb_init.py:init():899] backend started and connected
14
+ 2026-04-18 17:28:47,874 INFO MainThread:10295 [wandb_init.py:init():969] updated telemetry
15
+ 2026-04-18 17:28:47,875 INFO MainThread:10295 [wandb_init.py:init():993] communicating run to backend with 90.0 second timeout
16
+ 2026-04-18 17:28:49,589 INFO MainThread:10295 [wandb_init.py:init():1040] starting run threads in backend
17
+ 2026-04-18 17:28:50,217 INFO MainThread:10295 [wandb_run.py:_console_start():2504] atexit reg
18
+ 2026-04-18 17:28:50,218 INFO MainThread:10295 [wandb_run.py:_redirect():2352] redirect: wrap_raw
19
+ 2026-04-18 17:28:50,218 INFO MainThread:10295 [wandb_run.py:_redirect():2421] Wrapping output streams.
20
+ 2026-04-18 17:28:50,218 INFO MainThread:10295 [wandb_run.py:_redirect():2444] Redirects installed.
21
+ 2026-04-18 17:28:50,224 INFO MainThread:10295 [wandb_init.py:init():1080] run started, returning control to user process
22
+ 2026-04-18 17:28:50,229 INFO MainThread:10295 [wandb_run.py:_config_callback():1385] config_cb None None {'peft_config': {'default': {'task_type': 'CAUSAL_LM', 'peft_type': 'LORA', 'auto_mapping': None, 'peft_version': '0.18.1', 'base_model_name_or_path': '/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/qwen3-asr-merged', 'revision': None, 'inference_mode': False, 'r': 8, 'target_modules': '^(thinker\\.model(?=\\.).*\\.(up_proj|q_proj|o_proj|gate_proj|k_proj|v_proj|down_proj)|thinker\\.audio_tower\\.layers(?=\\.).*\\.(q_proj|fc1|out_proj|k_proj|v_proj|fc2)|thinker\\.audio_tower\\.conv_out(?=\\.)|thinker\\.audio_tower\\.proj1(?=\\.)|thinker\\.audio_tower\\.proj2(?=\\.))$', 'exclude_modules': None, 'lora_alpha': 32, 'lora_dropout': 0.05, 'fan_in_fan_out': False, 'bias': 'none', 'use_rslora': False, 'modules_to_save': [], 'init_lora_weights': True, 'layers_to_transform': None, 'layers_pattern': None, 'rank_pattern': {}, 'alpha_pattern': {}, 'megatron_config': None, 'megatron_core': 'megatron.core', 'trainable_token_indices': None, 'loftq_config': {}, 'eva_config': None, 'corda_config': None, 'use_dora': False, 'alora_invocation_tokens': None, 'use_qalora': False, 'qalora_group_size': 16, 'layer_replication': None, 'runtime_config': {'ephemeral_gpu_offload': False}, 'lora_bias': False, 'target_parameters': None, 'arrow_config': None, 'ensure_weight_tying': False, 'lora_dtype': None, 'lorap_lr_ratio': None, 'lorap_emb_lr': 1e-06}}, 'return_dict': True, 'output_hidden_states': False, 'torchscript': False, 'dtype': 'bfloat16', 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'architectures': ['Qwen3ASRForConditionalGeneration'], 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'task_specific_params': None, 'problem_type': None, 
'tokenizer_class': None, 'prefix': None, 'bos_token_id': None, 'pad_token_id': 151643, 'eos_token_id': 151645, 'sep_token_id': None, 'decoder_start_token_id': None, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'temperature': 0.5, 'top_k': 50, 'top_p': 0.95, 'typical_p': 1.0, 'repetition_penalty': 1.08, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'num_beam_groups': 1, 'diversity_penalty': 0.0, '_name_or_path': '/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/qwen3-asr-merged', 'transformers_version': '4.57.6', 'model_type': 'qwen3_asr', 'tf_legacy_loss': False, 'use_bfloat16': False, 'thinker_config': {'return_dict': True, 'output_hidden_states': False, 'torchscript': False, 'dtype': 'bfloat16', 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'architectures': ['Qwen3ASRForConditionalGeneration'], 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'task_specific_params': None, 'problem_type': None, 'tokenizer_class': None, 'prefix': None, 'bos_token_id': None, 'pad_token_id': None, 'eos_token_id': None, 'sep_token_id': None, 'decoder_start_token_id': None, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'typical_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 
'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'num_beam_groups': 1, 'diversity_penalty': 0.0, '_name_or_path': '', 'audio_end_token_id': 151670, 'model_type': 'qwen3_asr_thinker', 'tf_legacy_loss': False, 'use_bfloat16': False, 'user_token_id': 872, 'audio_start_token_id': 151669, 'initializer_range': 0.02, 'audio_config': {'return_dict': True, 'output_hidden_states': False, 'torchscript': False, 'dtype': None, 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'architectures': None, 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'task_specific_params': None, 'problem_type': None, 'tokenizer_class': None, 'prefix': None, 'bos_token_id': None, 'pad_token_id': None, 'eos_token_id': None, 'sep_token_id': None, 'decoder_start_token_id': None, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'typical_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'num_beam_groups': 1, 'diversity_penalty': 0.0, '_name_or_path': '', 'model_type': 'qwen3_asr_audio_encoder', 'num_hidden_layers': 24, 'tf_legacy_loss': False, 'use_bfloat16': False, 'num_mel_bins': 128, 'd_model': 
1024, 'encoder_layers': 24, 'encoder_attention_heads': 16, 'encoder_ffn_dim': 4096, 'dropout': 0, 'attention_dropout': 0, 'activation_function': 'gelu', 'activation_dropout': 0, 'initializer_range': 0.02, 'scale_embedding': False, 'max_source_positions': 1500, 'n_window': 50, 'output_dim': 2048, 'n_window_infer': 800, 'conv_chunksize': 500, 'downsample_hidden_size': 480, 'output_attentions': False}, 'text_config': {'vocab_size': 151936, 'max_position_embeddings': 65536, 'hidden_size': 2048, 'intermediate_size': 6144, 'num_hidden_layers': 28, 'num_attention_heads': 16, 'num_key_value_heads': 8, 'head_dim': 128, 'hidden_act': 'silu', 'initializer_range': 0.02, 'rms_norm_eps': 1e-06, 'use_cache': False, 'rope_theta': 1000000, 'rope_scaling': {'interleaved': True, 'mrope_interleaved': True, 'mrope_section': [24, 20, 20], 'rope_type': 'default', 'type': 'default'}, 'attention_bias': False, 'attention_dropout': 0.0, 'return_dict': True, 'output_hidden_states': False, 'torchscript': False, 'dtype': None, 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'architectures': None, 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'task_specific_params': None, 'problem_type': None, 'tokenizer_class': None, 'prefix': None, 'bos_token_id': None, 'pad_token_id': 151643, 'eos_token_id': None, 'sep_token_id': None, 'decoder_start_token_id': None, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'typical_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 
'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'num_beam_groups': 1, 'diversity_penalty': 0.0, '_name_or_path': '', 'model_type': 'qwen3_asr_text', 'tf_legacy_loss': False, 'use_bfloat16': False, 'output_attentions': False}, 'audio_token_id': 151676, 'output_attentions': False}, 'support_languages': ['Chinese', 'English', 'Cantonese', 'Arabic', 'German', 'French', 'Spanish', 'Portuguese', 'Indonesian', 'Italian', 'Korean', 'Russian', 'Thai', 'Vietnamese', 'Japanese', 'Turkish', 'Hindi', 'Malay', 'Dutch', 'Swedish', 'Danish', 'Finnish', 'Polish', 'Czech', 'Filipino', 'Persian', 'Greek', 'Romanian', 'Hungarian', 'Macedonian'], 'output_attentions': False, 'output_dir': '/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/out/qwen3asr_dapo_reward56_4x4x12_12gen_4GPU/v5-20260418-172837', 'overwrite_output_dir': False, 'do_train': False, 'do_eval': True, 'do_predict': False, 'eval_strategy': 'steps', 'prediction_loss_only': False, 'per_device_train_batch_size': 4, 'per_device_eval_batch_size': 4, 'per_gpu_train_batch_size': None, 'per_gpu_eval_batch_size': None, 'gradient_accumulation_steps': 12, 'eval_accumulation_steps': None, 'eval_delay': 0, 'torch_empty_cache_steps': None, 'learning_rate': 5e-05, 'weight_decay': 0.1, 'adam_beta1': 0.9, 'adam_beta2': 0.95, 'adam_epsilon': 1e-08, 'max_grad_norm': 1.0, 'num_train_epochs': 3.0, 'max_steps': -1, 'lr_scheduler_type': 'cosine', 'lr_scheduler_kwargs': None, 'warmup_ratio': 0.03, 'warmup_steps': 0, 'log_level': 'passive', 'log_level_replica': 'warning', 'log_on_each_node': True, 'logging_dir': '/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/out/qwen3asr_dapo_reward56_4x4x12_12gen_4GPU/v5-20260418-172837/runs', 'logging_strategy': 'steps', 'logging_first_step': True, 'logging_steps': 5, 'logging_nan_inf_filter': True, 'save_strategy': 'steps', 'save_steps': 20, 'save_total_limit': 
None, 'save_safetensors': True, 'save_on_each_node': False, 'save_only_model': False, 'restore_callback_states_from_checkpoint': False, 'no_cuda': False, 'use_cpu': False, 'use_mps_device': False, 'seed': 42, 'data_seed': 42, 'jit_mode_eval': False, 'bf16': True, 'fp16': False, 'fp16_opt_level': 'O1', 'half_precision_backend': 'auto', 'bf16_full_eval': False, 'fp16_full_eval': False, 'tf32': None, 'local_rank': 0, 'ddp_backend': None, 'tpu_num_cores': None, 'tpu_metrics_debug': False, 'debug': [], 'dataloader_drop_last': True, 'eval_steps': 20, 'dataloader_num_workers': 1, 'dataloader_prefetch_factor': 2, 'past_index': -1, 'run_name': 'qwen3asr_dapo_reward56_4x4x12_12gen_4GPU', 'disable_tqdm': False, 'remove_unused_columns': False, 'label_names': None, 'load_best_model_at_end': False, 'metric_for_best_model': 'loss', 'greater_is_better': False, 'ignore_data_skip': False, 'fsdp': [], 'fsdp_min_num_params': 0, 'fsdp_config': {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}, 'fsdp_transformer_layer_cls_to_wrap': None, 'accelerator_config': {'split_batches': False, 'dispatch_batches': False, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None}, 'parallelism_config': None, 'deepspeed': None, 'label_smoothing_factor': 0.0, 'optim': 'adamw_torch', 'optim_args': None, 'adafactor': False, 'group_by_length': False, 'length_column_name': 'length', 'report_to': ['wandb'], 'project': 'huggingface', 'trackio_space_id': 'trackio', 'ddp_find_unused_parameters': None, 'ddp_bucket_cap_mb': None, 'ddp_broadcast_buffers': None, 'dataloader_pin_memory': True, 'dataloader_persistent_workers': False, 'skip_memory_metrics': True, 'use_legacy_prediction_loop': False, 'push_to_hub': False, 'resume_from_checkpoint': None, 'hub_model_id': None, 'hub_strategy': 'every_save', 'hub_token': '<HUB_TOKEN>', 'hub_private_repo': None, 'hub_always_push': False, 'hub_revision': None, 
'gradient_checkpointing': False, 'gradient_checkpointing_kwargs': None, 'include_inputs_for_metrics': False, 'include_for_metrics': [], 'eval_do_concat_batches': True, 'fp16_backend': 'auto', 'push_to_hub_model_id': None, 'push_to_hub_organization': None, 'push_to_hub_token': '<PUSH_TO_HUB_TOKEN>', 'mp_parameters': '', 'auto_find_batch_size': False, 'full_determinism': False, 'torchdynamo': None, 'ray_scope': 'last', 'ddp_timeout': 18000000, 'torch_compile': False, 'torch_compile_backend': None, 'torch_compile_mode': None, 'include_tokens_per_second': False, 'include_num_input_tokens_seen': 'no', 'neftune_noise_alpha': None, 'optim_target_modules': None, 'batch_eval_metrics': False, 'eval_on_start': False, 'use_liger_kernel': False, 'liger_kernel_config': None, 'eval_use_gather_object': False, 'average_tokens_across_devices': True, 'model_init_kwargs': None, 'disable_dropout': False, 'cast_lm_head_to_fp32': False, 'num_generations': 12, 'num_generations_eval': 4, 'max_completion_length': 256, 'ds3_gather_for_generation': True, 'shuffle_dataset': True, 'generation_batch_size': 48, 'steps_per_generation': 3, 'min_p': None, 'generation_kwargs': None, 'chat_template_kwargs': None, 'use_transformers_paged': False, 'cache_implementation': None, 'use_vllm': False, 'vllm_mode': None, 'vllm_model_impl': 'vllm', 'vllm_enable_sleep_mode': False, 'vllm_structured_outputs_regex': None, 'vllm_server_base_url': None, 'vllm_server_host': None, 'vllm_server_port': [8000], 'vllm_server_timeout': 240.0, 'vllm_group_port': 51216, 'vllm_gpu_memory_utilization': 0.9, 'vllm_max_model_length': None, 'vllm_tensor_parallel_size': 1, 'beta': 0.04, 'num_iterations': 2, 'epsilon': 0.2, 'delta': None, 'epsilon_high': 0.28, 'sapo_temperature_neg': 1.05, 'sapo_temperature_pos': 1.0, 'importance_sampling_level': 'token', 'reward_weights': None, 'multi_objective_aggregation': 'sum_then_normalize', 'scale_rewards': 'group', 'loss_type': 'dapo', 'mask_truncated_completions': False, 'sync_ref_model': 
False, 'ref_model_mixup_alpha': 0.6, 'ref_model_sync_steps': 512, 'top_entropy_quantile': 1.0, 'max_tool_calling_iterations': None, 'vllm_importance_sampling_correction': True, 'vllm_importance_sampling_mode': 'sequence_mask', 'vllm_importance_sampling_cap': 3.0, 'off_policy_mask_threshold': None, 'use_bias_correction_kl': False, 'log_completions': True, 'num_completions_to_print': None, 'log_unique_prompts': False, 'log_completions_hub_repo': None, 'tuner_backend': 'peft', 'vit_gradient_checkpointing': True, 'router_aux_loss_coef': 0.0, 'enable_dft_loss': False, 'enable_channel_loss': False, 'safe_serialization': True, 'max_shard_size': '5GB', 'check_model': True, 'acc_strategy': 'token', 'train_dataloader_shuffle': True, 'max_epochs': None, 'aligner_lr': None, 'vit_lr': None, 'use_logits_to_keep': None, 'resume_only_model': False, 'optimizer': None, 'eval_metric': None, 'callbacks': [], 'early_stop_interval': None, 'eval_use_evalscope': False, 'eval_dataset': [], 'eval_dataset_args': None, 'eval_limit': None, 'eval_generation_config': None, 'extra_eval_args': None, 'tuner_type': 'lora', 'use_galore': False, 'galore_target_modules': None, 'galore_rank': 128, 'galore_update_proj_gap': 50, 'galore_scale': 1.0, 'galore_proj_type': 'std', 'galore_optim_per_parameter': False, 'galore_with_embedding': False, 'galore_quantization': False, 'galore_proj_quant': False, 'galore_proj_bits': 4, 'galore_proj_group_size': 256, 'galore_cos_threshold': 0.4, 'galore_gamma_proj': 2, 'galore_queue_size': 5, 'lisa_activated_layers': 0, 'lisa_step_interval': 20, 'use_flash_ckpt': False, 'vllm_pipeline_parallel_size': 1, 'vllm_enable_expert_parallel': False, 'vllm_max_num_seqs': None, 'vllm_max_model_len': None, 'vllm_disable_custom_all_reduce': True, 'vllm_enforce_eager': False, 'vllm_limit_mm_per_prompt': None, 'vllm_max_lora_rank': 16, 'vllm_enable_prefix_caching': True, 'vllm_use_async_engine': None, 'vllm_quantization': None, 'vllm_reasoning_parser': None, 
'vllm_disable_cascade_attn': False, 'vllm_mm_processor_cache_gb': None, 'vllm_speculative_config': None, 'vllm_engine_kwargs': {}, 'vllm_data_parallel_size': 1, 'stop_words': [], 'vllm_enable_lora': False, 'lora_rank': 8, 'vllm_server_group_port': None, 'enable_flattened_weight_sync': True, 'async_generate': False, 'structured_outputs_regex': None, 'sleep_level': 0, 'move_model_batches': None, 'offload_optimizer': False, 'offload_model': False, 'wandb_log_unique_prompts': None, 'cosine_min_len_value_wrong': -0.5, 'cosine_max_len_value_wrong': 0.0, 'cosine_min_len_value_correct': 1.0, 'cosine_max_len_value_correct': 0.5, 'cosine_max_len': 256, 'repetition_n_grams': 3, 'repetition_max_penalty': -1.0, 'reward_model': None, 'reward_model_plugin': None, 'chord_sft_dataset': [], 'chord_sft_per_device_train_batch_size': None, 'chord_enable_phi_function': False, 'chord_mu_warmup_steps': None, 'chord_mu_decay_steps': None, 'chord_mu_peak': None, 'chord_mu_valley': None, 'multi_turn_scheduler': None, 'max_turns': None, 'completion_length_limit_scope': 'per_round', 'vllm_server_pass_dataset': False, 'dynamic_sample': True, 'max_resample_times': 4, 'overlong_filter': True, 'soft_max_length': None, 'soft_cache_length': None, 'log_entropy': False, 'tau_pos': 1.0, 'tau_neg': 1.05, 'advantage_estimator': 'grpo', 'kl_in_reward': False, 'dataset_shuffle': True, 'rollout_importance_sampling_mode': None, 'rollout_importance_sampling_threshold': 2.0, 'log_rollout_offpolicy_metrics': False, 'off_policy_sequence_mask_delta': None}
23
+ 2026-04-18 17:28:50,239 INFO MainThread:10295 [wandb_config.py:__setitem__():154] [no run ID] config set model/num_parameters = 2050307712 - <bound method Run._config_callback of <wandb.sdk.wandb_run.Run object at 0x7f7e494768f0>>
24
+ 2026-04-18 17:28:50,239 INFO MainThread:10295 [wandb_run.py:_config_callback():1385] config_cb model/num_parameters 2050307712 None
25
+ 2026-04-20 16:05:30,791 INFO wandb-AsyncioManager-main:10295 [service_client.py:_forward_responses():80] Reached EOF.
26
+ 2026-04-20 16:05:30,792 INFO wandb-AsyncioManager-main:10295 [mailbox.py:close():137] Closing mailbox, abandoning 1 handles.
wandb/run-20260417_122253-6ntp64iz/files/output.log ADDED
The diff for this file is too large to render. See raw diff
 
wandb/run-20260417_122253-6ntp64iz/files/requirements.txt ADDED
@@ -0,0 +1,255 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ psutil==7.2.2
2
+ colorama==0.4.6
3
+ typing-inspection==0.4.2
4
+ dill==0.3.8
5
+ aliyun-python-sdk-kms==2.16.5
6
+ urllib3==2.6.3
7
+ torch==2.6.0
8
+ threadpoolctl==3.6.0
9
+ pyzmq==27.1.0
10
+ astor==0.8.1
11
+ hf-xet==1.4.3
12
+ sniffio==1.3.1
13
+ tensorboard==2.20.0
14
+ fastar==0.11.0
15
+ llvmlite==0.43.0
16
+ pathspec==1.0.4
17
+ mkl_fft==1.3.11
18
+ prometheus_client==0.25.0
19
+ async-timeout==5.0.1
20
+ scikit-learn==1.7.2
21
+ sortedcontainers==2.4.0
22
+ Bottleneck==1.4.2
23
+ orjson==3.11.8
24
+ nest-asyncio==1.6.0
25
+ cupy-cuda12x==13.6.0
26
+ semantic-version==2.10.0
27
+ aiosignal==1.4.0
28
+ fsspec==2025.3.0
29
+ dyNET38==2.2
30
+ shellingham==1.5.4
31
+ zstandard==0.25.0
32
+ PyYAML==6.0.3
33
+ nvidia-curand-cu12==10.3.5.147
34
+ gradio==5.50.0
35
+ Werkzeug==3.1.8
36
+ grpcio==1.80.0
37
+ aiohttp==3.13.5
38
+ Flask==3.1.3
39
+ python-json-logger==4.1.0
40
+ trl==0.29.1
41
+ nltk==3.9.4
42
+ platformdirs==4.9.6
43
+ lm-format-enforcer==0.10.12
44
+ pyparsing==3.3.2
45
+ jmespath==0.10.0
46
+ starlette==0.52.1
47
+ crcmod==1.7
48
+ dnspython==2.8.0
49
+ antlr4-python3-runtime==4.9.3
50
+ rouge==1.0.1
51
+ importlib_metadata==9.0.0
52
+ nvidia-cudnn-cu12==9.1.0.70
53
+ safetensors==0.7.0
54
+ blake3==1.0.8
55
+ interegular==0.3.3
56
+ tiktoken==0.11.0
57
+ pydantic_core==2.41.4
58
+ outlines==0.1.11
59
+ airportsdata==20260315
60
+ rich-toolkit==0.19.7
61
+ multiprocess==0.70.16
62
+ sympy==1.13.1
63
+ psutil==7.2.2
64
+ h11==0.16.0
65
+ anyio==4.13.0
66
+ Cython==3.2.4
67
+ outlines_core==0.1.26
68
+ jsonschema==4.26.0
69
+ nvidia-cuda-cupti-cu12==12.4.127
70
+ meson-python==0.19.0
71
+ depyf==0.18.0
72
+ audioread==3.1.0
73
+ typer==0.24.1
74
+ nvidia-cuda-nvrtc-cu12==12.4.127
75
+ joblib==1.5.3
76
+ torchvision==0.21.0
77
+ hf-gradio==0.3.2
78
+ huggingface_hub==0.36.2
79
+ websockets==15.0.1
80
+ diskcache==5.6.3
81
+ mistral_common==1.11.0
82
+ partial-json-parser==0.2.1.1.post7
83
+ simplejson==3.20.2
84
+ watchfiles==1.1.1
85
+ Jinja2==3.1.6
86
+ GitPython==3.1.46
87
+ numexpr==2.11.0
88
+ pydub==0.25.1
89
+ brotli==1.2.0
90
+ binpacking==2.0.1
91
+ cmake==4.3.1
92
+ pydantic==2.12.3
93
+ mkl-service==2.4.0
94
+ protobuf==6.33.6
95
+ gguf==0.10.0
96
+ MarkupSafe==3.0.3
97
+ exceptiongroup==1.3.1
98
+ markdown-it-py==4.0.0
99
+ soxr==1.0.0
100
+ pyarrow==20.0.0
101
+ tqdm==4.67.3
102
+ meson==1.11.0
103
+ fonttools==4.62.1
104
+ annotated-types==0.7.0
105
+ networkx==3.4.2
106
+ nvidia-cuda-runtime-cu12==12.4.127
107
+ compressed-tensors==0.9.2
108
+ wandb==0.23.0
109
+ mdurl==0.1.2
110
+ charset-normalizer==3.4.7
111
+ Pygments==2.20.0
112
+ zipp==3.23.1
113
+ prometheus-fastapi-instrumentator==7.1.0
114
+ aiofiles==24.1.0
115
+ lark==1.2.2
116
+ addict==2.4.0
117
+ pydantic-settings==2.13.1
118
+ opencv-python-headless==4.11.0.86
119
+ certifi==2026.2.25
120
+ sox==1.5.0
121
+ nagisa==0.2.11
122
+ six==1.17.0
123
+ tokenizers==0.22.2
124
+ mkl_random==1.2.8
125
+ fastapi-cloud-cli==0.17.0
126
+ propcache==0.4.1
127
+ cachetools==7.0.5
128
+ rpds-py==0.30.0
129
+ torchaudio==2.6.0
130
+ setuptools==82.0.1
131
+ py-cpuinfo==9.0.0
132
+ tomli==2.4.1
133
+ xxhash==3.6.0
134
+ pip==26.0.1
135
+ contourpy==1.3.2
136
+ absl-py==2.4.0
137
+ mpmath==1.3.0
138
+ ms_swift==4.0.3
139
+ pyproject-metadata==0.11.0
140
+ aiohappyeyeballs==2.6.1
141
+ httpx==0.28.1
142
+ json_repair==0.59.4
143
+ blinker==1.9.0
144
+ tzdata==2025.3
145
+ tensorboard-data-server==0.7.2
146
+ pydantic-extra-types==2.11.1
147
+ Markdown==3.10.2
148
+ nvidia-cusparselt-cu12==0.6.2
149
+ rignore==0.7.6
150
+ openai==2.32.0
151
+ soundfile==0.13.1
152
+ lazy-loader==0.5
153
+ av==14.2.0
154
+ yarl==1.23.0
155
+ python-dateutil==2.9.0.post0
156
+ groovy==0.1.2
157
+ xformers==0.0.29.post2
158
+ qwen-omni-utils==0.0.9
159
+ rich==15.0.0
160
+ xgrammar==0.1.16
161
+ numba==0.60.0
162
+ nvidia-cusolver-cu12==11.6.1.9
163
+ scikit_build_core==0.12.2
164
+ ffmpy==1.0.0
165
+ wheel==0.46.3
166
+ jiter==0.14.0
167
+ oss2==2.19.1
168
+ transformers==4.57.6
169
+ fastrlock==0.8.3
170
+ click==8.3.2
171
+ pooch==1.9.0
172
+ distro==1.9.0
173
+ nvidia-cublas-cu12==12.4.5.8
174
+ regex==2026.4.4
175
+ cpm-kernels==1.0.11
176
+ safehttpx==0.1.7
177
+ matplotlib==3.10.8
178
+ httptools==0.7.1
179
+ nvidia-cusparse-cu12==12.3.1.170
180
+ qwen-asr==0.0.6
181
+ gradio_client==1.14.0
182
+ gitdb==4.0.12
183
+ fastapi-cli==0.0.24
184
+ soynlp==0.0.493
185
+ python-dotenv==1.2.2
186
+ nvidia-cufft-cu12==11.2.1.3
187
+ accelerate==1.12.0
188
+ tomlkit==0.13.3
189
+ triton==3.2.0
190
+ filelock==3.28.0
191
+ pycountry==26.2.16
192
+ modelscope==1.35.4
193
+ annotated-doc==0.0.4
194
+ referencing==0.37.0
195
+ numpy==1.26.4
196
+ aliyun-python-sdk-core==2.16.0
197
+ attrs==26.1.0
198
+ vllm==0.8.0
199
+ python-multipart==0.0.26
200
+ jsonschema-specifications==2025.9.1
201
+ idna==3.11
202
+ scipy==1.15.3
203
+ typing_extensions==4.15.0
204
+ itsdangerous==2.2.0
205
+ msgspec==0.21.1
206
+ msgpack==1.1.2
207
+ nvidia-nvjitlink-cu12==12.4.127
208
+ pycryptodome==3.23.0
209
+ ninja==1.13.0
210
+ pillow==11.3.0
211
+ email-validator==2.3.0
212
+ cryptography==46.0.7
213
+ peft==0.18.1
214
+ kiwisolver==1.5.0
215
+ cffi==2.0.0
216
+ einops==0.8.2
217
+ pytz==2026.1.post1
218
+ uvloop==0.22.1
219
+ requests==2.33.1
220
+ sentencepiece==0.2.1
221
+ attrdict==2.0.1
222
+ dacite==1.9.2
223
+ cloudpickle==3.1.2
224
+ ray==2.55.0
225
+ fastapi==0.135.3
226
+ librosa==0.11.0
227
+ ruff==0.15.10
228
+ multidict==6.7.1
229
+ smmap==5.0.3
230
+ packaging==26.0
231
+ pycparser==3.0
232
+ decorator==5.2.1
233
+ transformers-stream-generator==0.0.5
234
+ nvidia-nccl-cu12==2.21.5
235
+ frozenlist==1.8.0
236
+ uvicorn==0.44.0
237
+ datasets==3.6.0
238
+ cycler==0.12.1
239
+ omegaconf==2.3.0
240
+ httpcore==1.0.9
241
+ pandas==2.3.2
242
+ nvidia-nvtx-cu12==12.4.127
243
+ sentry-sdk==2.58.0
244
+ wheel==0.46.3
245
+ autocommand==2.2.2
246
+ tomli==2.4.0
247
+ packaging==26.0
248
+ more-itertools==10.8.0
249
+ zipp==3.23.0
250
+ platformdirs==4.4.0
251
+ jaraco.context==6.1.0
252
+ jaraco.text==4.0.0
253
+ backports.tarfile==1.2.0
254
+ jaraco.functools==4.4.0
255
+ importlib_metadata==8.7.1
wandb/run-20260417_122253-6ntp64iz/files/wandb-metadata.json ADDED
@@ -0,0 +1,223 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "os": "Linux-3.10.0-957.el7.x86_64-x86_64-with-glibc2.17",
3
+ "python": "CPython 3.10.18",
4
+ "startedAt": "2026-04-17T04:22:53.361994Z",
5
+ "args": [
6
+ "--rlhf_type",
7
+ "grpo",
8
+ "--external_plugins",
9
+ "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/my_qwen3_asr_dapo_register.py",
10
+ "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/0417_reward.py",
11
+ "--model",
12
+ "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/qwen3-asr-merged",
13
+ "--model_type",
14
+ "my_qwen3_asr_rl",
15
+ "--template",
16
+ "my_qwen3_asr_rl",
17
+ "--dataset",
18
+ "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/lora_0323_10w+55w+error+syn_with_domain_train90_targeted_rl_train90_loramerged_basewer_3suppress_server.jsonl",
19
+ "--val_dataset",
20
+ "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/lora_0323_10w+55w+error+syn_with_domain_train90_targeted_rl_val5_sample5p_server.jsonl",
21
+ "--reward_funcs",
22
+ "asr_wer_sub_len_cmp_hallu_dirty_v56",
23
+ "--train_type",
24
+ "lora",
25
+ "--use_vllm",
26
+ "false",
27
+ "--log_completions",
28
+ "true",
29
+ "--loss_type",
30
+ "dapo",
31
+ "--advantage_estimator",
32
+ "grpo",
33
+ "--scale_rewards",
34
+ "group",
35
+ "--num_iterations",
36
+ "2",
37
+ "--beta",
38
+ "0.04",
39
+ "--epsilon_high",
40
+ "0.28",
41
+ "--dynamic_sample",
42
+ "true",
43
+ "--max_resample_times",
44
+ "4",
45
+ "--overlong_filter",
46
+ "true",
47
+ "--truncation_strategy",
48
+ "delete",
49
+ "--num_generations",
50
+ "12",
51
+ "--generation_batch_size",
52
+ "48",
53
+ "--per_device_train_batch_size",
54
+ "8",
55
+ "--per_device_eval_batch_size",
56
+ "8",
57
+ "--gradient_accumulation_steps",
58
+ "12",
59
+ "--num_generations_eval",
60
+ "4",
61
+ "--max_completion_length",
62
+ "256",
63
+ "--temperature",
64
+ "0.50",
65
+ "--top_p",
66
+ "0.95",
67
+ "--top_k",
68
+ "50",
69
+ "--repetition_penalty",
70
+ "1.08",
71
+ "--learning_rate",
72
+ "5e-5",
73
+ "--lr_scheduler_type",
74
+ "cosine",
75
+ "--warmup_ratio",
76
+ "0.03",
77
+ "--report_to",
78
+ "wandb",
79
+ "--run_name",
80
+ "qwen3asr_dapo_reward56_4x4x12_12gen_4GPU",
81
+ "--output_dir",
82
+ "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/out/qwen3asr_dapo_reward56_4x4x12_12gen_4GPU",
83
+ "--save_strategy",
84
+ "steps",
85
+ "--save_steps",
86
+ "20",
87
+ "--logging_steps",
88
+ "5",
89
+ "--freeze_llm",
90
+ "false",
91
+ "--freeze_vit",
92
+ "false",
93
+ "--freeze_aligner",
94
+ "false",
95
+ "--remove_unused_columns",
96
+ "false",
97
+ "--padding_side",
98
+ "left"
99
+ ],
100
+ "program": "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/cli/rlhf.py",
101
+ "email": "pang_kaiyu@163.com",
102
+ "root": "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload",
103
+ "host": "SH-IDC1-10-140-37-95",
104
+ "executable": "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/bin/python3.10",
105
+ "cpu_count": 64,
106
+ "cpu_count_logical": 128,
107
+ "gpu": "NVIDIA A100-SXM4-80GB",
108
+ "gpu_count": 8,
109
+ "disk": {
110
+ "/": {
111
+ "total": "524945911808",
112
+ "used": "37367128064"
113
+ }
114
+ },
115
+ "memory": {
116
+ "total": "1081627828224"
117
+ },
118
+ "gpu_nvidia": [
119
+ {
120
+ "name": "NVIDIA A100-SXM4-80GB",
121
+ "memoryTotal": "85899345920",
122
+ "cudaCores": 6912,
123
+ "architecture": "Ampere",
124
+ "uuid": "GPU-87e7e3ab-b254-fc22-7407-8e2e88e9d854"
125
+ },
126
+ {
127
+ "name": "NVIDIA A100-SXM4-80GB",
128
+ "memoryTotal": "85899345920",
129
+ "cudaCores": 6912,
130
+ "architecture": "Ampere",
131
+ "uuid": "GPU-976db8a1-cf00-11c6-caaa-413862233fd4"
132
+ },
133
+ {
134
+ "name": "NVIDIA A100-SXM4-80GB",
135
+ "memoryTotal": "85899345920",
136
+ "cudaCores": 6912,
137
+ "architecture": "Ampere",
138
+ "uuid": "GPU-78b37ae8-44e0-e318-a6c0-f6f4ac78d46a"
139
+ },
140
+ {
141
+ "name": "NVIDIA A100-SXM4-80GB",
142
+ "memoryTotal": "85899345920",
143
+ "cudaCores": 6912,
144
+ "architecture": "Ampere",
145
+ "uuid": "GPU-840b937d-a7d4-68e7-ad57-f4568e01c3ae"
146
+ },
147
+ {
148
+ "name": "NVIDIA A100-SXM4-80GB",
149
+ "memoryTotal": "85899345920",
150
+ "cudaCores": 6912,
151
+ "architecture": "Ampere",
152
+ "uuid": "GPU-a9d0de54-f5b5-f83b-7bda-f53db844622d"
153
+ },
154
+ {
155
+ "name": "NVIDIA A100-SXM4-80GB",
156
+ "memoryTotal": "85899345920",
157
+ "cudaCores": 6912,
158
+ "architecture": "Ampere",
159
+ "uuid": "GPU-cb7d22e9-305c-c68c-64f1-599580742db0"
160
+ },
161
+ {
162
+ "name": "NVIDIA A100-SXM4-80GB",
163
+ "memoryTotal": "85899345920",
164
+ "cudaCores": 6912,
165
+ "architecture": "Ampere",
166
+ "uuid": "GPU-8d9704bb-4592-346f-a7f2-1a6ed8d58619"
167
+ },
168
+ {
169
+ "name": "NVIDIA A100-SXM4-80GB",
170
+ "memoryTotal": "85899345920",
171
+ "cudaCores": 6912,
172
+ "architecture": "Ampere",
173
+ "uuid": "GPU-3892f01b-e0b8-a9d9-0587-b5a7d2d9b5ab"
174
+ }
175
+ ],
176
+ "cudaVersion": "12.4",
177
+ "slurm": {
178
+ "cluster_name": "cluster_sproject3",
179
+ "conf": "/etc/slurm/slurm.conf",
180
+ "cpus_on_node": "2",
181
+ "gtids": "0",
182
+ "job_account": "research",
183
+ "job_cpus_per_node": "2",
184
+ "job_gid": "800000689",
185
+ "job_id": "8568770",
186
+ "job_name": "qwen_debug",
187
+ "job_nodelist": "SH-IDC1-10-140-37-95",
188
+ "job_num_nodes": "1",
189
+ "job_partition": "interntmp",
190
+ "job_qos": "normal",
191
+ "job_uid": "800000689",
192
+ "job_user": "panjiabao",
193
+ "jobid": "8568770",
194
+ "launch_node_ipaddr": "10.140.37.164",
195
+ "localid": "0",
196
+ "nnodes": "1",
197
+ "nodeid": "0",
198
+ "nodelist": "SH-IDC1-10-140-37-95",
199
+ "nprocs": "1",
200
+ "ntasks": "1",
201
+ "prio_process": "0",
202
+ "procid": "0",
203
+ "srun_comm_host": "10.140.37.164",
204
+ "srun_comm_port": "36403",
205
+ "step_gpus": "6,7",
206
+ "step_id": "0",
207
+ "step_launcher_port": "36403",
208
+ "step_nodelist": "SH-IDC1-10-140-37-95",
209
+ "step_num_nodes": "1",
210
+ "step_num_tasks": "1",
211
+ "step_tasks_per_node": "1",
212
+ "stepid": "0",
213
+ "submit_dir": "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload",
214
+ "submit_host": "SH-IDC1-10-140-37-164",
215
+ "task_pid": "31135",
216
+ "tasks_per_node": "1",
217
+ "topology_addr": "SH-IDC1-10-140-37-95",
218
+ "topology_addr_pattern": "node",
219
+ "umask": "0002",
220
+ "working_cluster": "cluster_sproject3:SH-IDC1-10-140-37-161:6817:9216:109"
221
+ },
222
+ "writerId": "sxwlerlqfwjgxrof5mrowpggo62a230u"
223
+ }
wandb/run-20260417_122253-6ntp64iz/files/wandb-summary.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"_wandb":{"runtime":2},"_runtime":2}
wandb/run-20260417_122253-6ntp64iz/logs/debug-core.log ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"time":"2026-04-17T12:22:53.678333465+08:00","level":"INFO","msg":"main: starting server","port-filename":"/tmp/tmpo93po4ye/port-45975.txt","pid":45975,"log-level":0,"disable-analytics":false,"shutdown-on-parent-exit":false,"enable-dcgm-profiling":false}
2
+ {"time":"2026-04-17T12:22:53.680473688+08:00","level":"INFO","msg":"server: will exit if parent process dies","ppid":45975}
3
+ {"time":"2026-04-17T12:22:53.680744122+08:00","level":"INFO","msg":"server: accepting connections","addr":{"Name":"/tmp/wandb-45975-46467-1709368994/socket","Net":"unix"}}
4
+ {"time":"2026-04-17T12:22:53.762137433+08:00","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"1(@)"}
5
+ {"time":"2026-04-17T12:22:53.771267911+08:00","level":"INFO","msg":"handleInformInit: received","streamId":"6ntp64iz","id":"1(@)"}
6
+ {"time":"2026-04-17T12:22:54.22640511+08:00","level":"INFO","msg":"handleInformInit: stream started","streamId":"6ntp64iz","id":"1(@)"}
7
+ {"time":"2026-04-17T12:22:57.706591473+08:00","level":"INFO","msg":"handleInformTeardown: server teardown initiated","id":"1(@)"}
8
+ {"time":"2026-04-17T12:22:57.707133174+08:00","level":"INFO","msg":"server is shutting down"}
9
+ {"time":"2026-04-17T12:22:57.707126026+08:00","level":"INFO","msg":"connection: closing","id":"1(@)"}
10
+ {"time":"2026-04-17T12:22:57.707711702+08:00","level":"INFO","msg":"server: listener closed","addr":{"Name":"/tmp/wandb-45975-46467-1709368994/socket","Net":"unix"}}
11
+ {"time":"2026-04-17T12:22:57.708226504+08:00","level":"INFO","msg":"connection: closed successfully","id":"1(@)"}
12
+ {"time":"2026-04-17T12:22:57.795817111+08:00","level":"INFO","msg":"server: parent process exited, terminating service process"}
wandb/run-20260417_122253-6ntp64iz/logs/debug-internal.log ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {"time":"2026-04-17T12:22:53.773961459+08:00","level":"INFO","msg":"stream: starting","core version":"0.23.0"}
2
+ {"time":"2026-04-17T12:22:54.222742714+08:00","level":"INFO","msg":"stream: created new stream","id":"6ntp64iz"}
3
+ {"time":"2026-04-17T12:22:54.222847789+08:00","level":"INFO","msg":"handler: started","stream_id":"6ntp64iz"}
4
+ {"time":"2026-04-17T12:22:54.226396493+08:00","level":"INFO","msg":"stream: started","id":"6ntp64iz"}
5
+ {"time":"2026-04-17T12:22:54.22641049+08:00","level":"INFO","msg":"sender: started","stream_id":"6ntp64iz"}
6
+ {"time":"2026-04-17T12:22:54.226419522+08:00","level":"INFO","msg":"writer: started","stream_id":"6ntp64iz"}
7
+ {"time":"2026-04-17T12:22:57.70713564+08:00","level":"INFO","msg":"stream: closing","id":"6ntp64iz"}
wandb/run-20260417_122253-6ntp64iz/logs/debug.log ADDED
@@ -0,0 +1,26 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2026-04-17 12:22:53,409 INFO MainThread:45975 [wandb_setup.py:_flush():80] Current SDK version is 0.23.0
2
+ 2026-04-17 12:22:53,409 INFO MainThread:45975 [wandb_setup.py:_flush():80] Configure stats pid to 45975
3
+ 2026-04-17 12:22:53,409 INFO MainThread:45975 [wandb_setup.py:_flush():80] Loading settings from /mnt/petrelfs/panjiabao/.config/wandb/settings
4
+ 2026-04-17 12:22:53,409 INFO MainThread:45975 [wandb_setup.py:_flush():80] Loading settings from /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/wandb/settings
5
+ 2026-04-17 12:22:53,409 INFO MainThread:45975 [wandb_setup.py:_flush():80] Loading settings from environment variables
6
+ 2026-04-17 12:22:53,409 INFO MainThread:45975 [wandb_init.py:setup_run_log_directory():713] Logging user logs to /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/wandb/run-20260417_122253-6ntp64iz/logs/debug.log
7
+ 2026-04-17 12:22:53,409 INFO MainThread:45975 [wandb_init.py:setup_run_log_directory():714] Logging internal logs to /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/wandb/run-20260417_122253-6ntp64iz/logs/debug-internal.log
8
+ 2026-04-17 12:22:53,409 INFO MainThread:45975 [wandb_init.py:init():840] calling init triggers
9
+ 2026-04-17 12:22:53,409 INFO MainThread:45975 [wandb_init.py:init():845] wandb.init called with sweep_config: {}
10
+ config: {'_wandb': {}}
11
+ 2026-04-17 12:22:53,409 INFO MainThread:45975 [wandb_init.py:init():888] starting backend
12
+ 2026-04-17 12:22:53,762 INFO MainThread:45975 [wandb_init.py:init():891] sending inform_init request
13
+ 2026-04-17 12:22:53,766 INFO MainThread:45975 [wandb_init.py:init():899] backend started and connected
14
+ 2026-04-17 12:22:53,768 INFO MainThread:45975 [wandb_init.py:init():969] updated telemetry
15
+ 2026-04-17 12:22:53,769 INFO MainThread:45975 [wandb_init.py:init():993] communicating run to backend with 90.0 second timeout
16
+ 2026-04-17 12:22:55,268 INFO MainThread:45975 [wandb_init.py:init():1040] starting run threads in backend
17
+ 2026-04-17 12:22:55,848 INFO MainThread:45975 [wandb_run.py:_console_start():2504] atexit reg
18
+ 2026-04-17 12:22:55,848 INFO MainThread:45975 [wandb_run.py:_redirect():2352] redirect: wrap_raw
19
+ 2026-04-17 12:22:55,848 INFO MainThread:45975 [wandb_run.py:_redirect():2421] Wrapping output streams.
20
+ 2026-04-17 12:22:55,848 INFO MainThread:45975 [wandb_run.py:_redirect():2444] Redirects installed.
21
+ 2026-04-17 12:22:55,854 INFO MainThread:45975 [wandb_init.py:init():1080] run started, returning control to user process
22
+ 2026-04-17 12:22:55,859 INFO MainThread:45975 [wandb_run.py:_config_callback():1385] config_cb None None {'peft_config': {'default': {'task_type': 'CAUSAL_LM', 'peft_type': 'LORA', 'auto_mapping': None, 'peft_version': '0.18.1', 'base_model_name_or_path': '/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/qwen3-asr-merged', 'revision': None, 'inference_mode': False, 'r': 8, 'target_modules': '^(thinker\\.model(?=\\.).*\\.(v_proj|down_proj|gate_proj|q_proj|o_proj|k_proj|up_proj)|thinker\\.audio_tower\\.layers(?=\\.).*\\.(v_proj|fc2|fc1|out_proj|q_proj|k_proj)|thinker\\.audio_tower\\.conv_out(?=\\.)|thinker\\.audio_tower\\.proj1(?=\\.)|thinker\\.audio_tower\\.proj2(?=\\.))$', 'exclude_modules': None, 'lora_alpha': 32, 'lora_dropout': 0.05, 'fan_in_fan_out': False, 'bias': 'none', 'use_rslora': False, 'modules_to_save': [], 'init_lora_weights': True, 'layers_to_transform': None, 'layers_pattern': None, 'rank_pattern': {}, 'alpha_pattern': {}, 'megatron_config': None, 'megatron_core': 'megatron.core', 'trainable_token_indices': None, 'loftq_config': {}, 'eva_config': None, 'corda_config': None, 'use_dora': False, 'alora_invocation_tokens': None, 'use_qalora': False, 'qalora_group_size': 16, 'layer_replication': None, 'runtime_config': {'ephemeral_gpu_offload': False}, 'lora_bias': False, 'target_parameters': None, 'arrow_config': None, 'ensure_weight_tying': False, 'lora_dtype': None, 'lorap_lr_ratio': None, 'lorap_emb_lr': 1e-06}}, 'return_dict': True, 'output_hidden_states': False, 'torchscript': False, 'dtype': 'bfloat16', 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'architectures': ['Qwen3ASRForConditionalGeneration'], 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'task_specific_params': None, 'problem_type': None, 
'tokenizer_class': None, 'prefix': None, 'bos_token_id': None, 'pad_token_id': 151643, 'eos_token_id': 151645, 'sep_token_id': None, 'decoder_start_token_id': None, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'temperature': 0.5, 'top_k': 50, 'top_p': 0.95, 'typical_p': 1.0, 'repetition_penalty': 1.08, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'num_beam_groups': 1, 'diversity_penalty': 0.0, '_name_or_path': '/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/qwen3-asr-merged', 'transformers_version': '4.57.6', 'model_type': 'qwen3_asr', 'tf_legacy_loss': False, 'use_bfloat16': False, 'thinker_config': {'return_dict': True, 'output_hidden_states': False, 'torchscript': False, 'dtype': 'bfloat16', 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'architectures': ['Qwen3ASRForConditionalGeneration'], 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'task_specific_params': None, 'problem_type': None, 'tokenizer_class': None, 'prefix': None, 'bos_token_id': None, 'pad_token_id': None, 'eos_token_id': None, 'sep_token_id': None, 'decoder_start_token_id': None, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'typical_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 
'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'num_beam_groups': 1, 'diversity_penalty': 0.0, '_name_or_path': '', 'audio_end_token_id': 151670, 'model_type': 'qwen3_asr_thinker', 'tf_legacy_loss': False, 'use_bfloat16': False, 'user_token_id': 872, 'audio_start_token_id': 151669, 'initializer_range': 0.02, 'audio_config': {'return_dict': True, 'output_hidden_states': False, 'torchscript': False, 'dtype': None, 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'architectures': None, 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'task_specific_params': None, 'problem_type': None, 'tokenizer_class': None, 'prefix': None, 'bos_token_id': None, 'pad_token_id': None, 'eos_token_id': None, 'sep_token_id': None, 'decoder_start_token_id': None, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'typical_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'num_beam_groups': 1, 'diversity_penalty': 0.0, '_name_or_path': '', 'model_type': 'qwen3_asr_audio_encoder', 'num_hidden_layers': 24, 'tf_legacy_loss': False, 'use_bfloat16': False, 'num_mel_bins': 128, 'd_model': 
1024, 'encoder_layers': 24, 'encoder_attention_heads': 16, 'encoder_ffn_dim': 4096, 'dropout': 0, 'attention_dropout': 0, 'activation_function': 'gelu', 'activation_dropout': 0, 'initializer_range': 0.02, 'scale_embedding': False, 'max_source_positions': 1500, 'n_window': 50, 'output_dim': 2048, 'n_window_infer': 800, 'conv_chunksize': 500, 'downsample_hidden_size': 480, 'output_attentions': False}, 'text_config': {'vocab_size': 151936, 'max_position_embeddings': 65536, 'hidden_size': 2048, 'intermediate_size': 6144, 'num_hidden_layers': 28, 'num_attention_heads': 16, 'num_key_value_heads': 8, 'head_dim': 128, 'hidden_act': 'silu', 'initializer_range': 0.02, 'rms_norm_eps': 1e-06, 'use_cache': False, 'rope_theta': 1000000, 'rope_scaling': {'interleaved': True, 'mrope_interleaved': True, 'mrope_section': [24, 20, 20], 'rope_type': 'default', 'type': 'default'}, 'attention_bias': False, 'attention_dropout': 0.0, 'return_dict': True, 'output_hidden_states': False, 'torchscript': False, 'dtype': None, 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'architectures': None, 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'task_specific_params': None, 'problem_type': None, 'tokenizer_class': None, 'prefix': None, 'bos_token_id': None, 'pad_token_id': 151643, 'eos_token_id': None, 'sep_token_id': None, 'decoder_start_token_id': None, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'typical_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 
'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'num_beam_groups': 1, 'diversity_penalty': 0.0, '_name_or_path': '', 'model_type': 'qwen3_asr_text', 'tf_legacy_loss': False, 'use_bfloat16': False, 'output_attentions': False}, 'audio_token_id': 151676, 'output_attentions': False}, 'support_languages': ['Chinese', 'English', 'Cantonese', 'Arabic', 'German', 'French', 'Spanish', 'Portuguese', 'Indonesian', 'Italian', 'Korean', 'Russian', 'Thai', 'Vietnamese', 'Japanese', 'Turkish', 'Hindi', 'Malay', 'Dutch', 'Swedish', 'Danish', 'Finnish', 'Polish', 'Czech', 'Filipino', 'Persian', 'Greek', 'Romanian', 'Hungarian', 'Macedonian'], 'output_attentions': False, 'output_dir': '/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/out/qwen3asr_dapo_reward56_4x4x12_12gen_4GPU/v2-20260417-122243', 'overwrite_output_dir': False, 'do_train': False, 'do_eval': True, 'do_predict': False, 'eval_strategy': 'steps', 'prediction_loss_only': False, 'per_device_train_batch_size': 8, 'per_device_eval_batch_size': 8, 'per_gpu_train_batch_size': None, 'per_gpu_eval_batch_size': None, 'gradient_accumulation_steps': 12, 'eval_accumulation_steps': None, 'eval_delay': 0, 'torch_empty_cache_steps': None, 'learning_rate': 5e-05, 'weight_decay': 0.1, 'adam_beta1': 0.9, 'adam_beta2': 0.95, 'adam_epsilon': 1e-08, 'max_grad_norm': 1.0, 'num_train_epochs': 3.0, 'max_steps': -1, 'lr_scheduler_type': 'cosine', 'lr_scheduler_kwargs': None, 'warmup_ratio': 0.03, 'warmup_steps': 0, 'log_level': 'passive', 'log_level_replica': 'warning', 'log_on_each_node': True, 'logging_dir': '/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/out/qwen3asr_dapo_reward56_4x4x12_12gen_4GPU/v2-20260417-122243/runs', 'logging_strategy': 'steps', 'logging_first_step': True, 'logging_steps': 5, 'logging_nan_inf_filter': True, 'save_strategy': 'steps', 'save_steps': 20, 'save_total_limit': 
None, 'save_safetensors': True, 'save_on_each_node': False, 'save_only_model': False, 'restore_callback_states_from_checkpoint': False, 'no_cuda': False, 'use_cpu': False, 'use_mps_device': False, 'seed': 42, 'data_seed': 42, 'jit_mode_eval': False, 'bf16': True, 'fp16': False, 'fp16_opt_level': 'O1', 'half_precision_backend': 'auto', 'bf16_full_eval': False, 'fp16_full_eval': False, 'tf32': None, 'local_rank': 0, 'ddp_backend': None, 'tpu_num_cores': None, 'tpu_metrics_debug': False, 'debug': [], 'dataloader_drop_last': True, 'eval_steps': 20, 'dataloader_num_workers': 1, 'dataloader_prefetch_factor': 2, 'past_index': -1, 'run_name': 'qwen3asr_dapo_reward56_4x4x12_12gen_4GPU', 'disable_tqdm': False, 'remove_unused_columns': False, 'label_names': None, 'load_best_model_at_end': False, 'metric_for_best_model': 'loss', 'greater_is_better': False, 'ignore_data_skip': False, 'fsdp': [], 'fsdp_min_num_params': 0, 'fsdp_config': {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}, 'fsdp_transformer_layer_cls_to_wrap': None, 'accelerator_config': {'split_batches': False, 'dispatch_batches': False, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None}, 'parallelism_config': None, 'deepspeed': None, 'label_smoothing_factor': 0.0, 'optim': 'adamw_torch', 'optim_args': None, 'adafactor': False, 'group_by_length': False, 'length_column_name': 'length', 'report_to': ['wandb'], 'project': 'huggingface', 'trackio_space_id': 'trackio', 'ddp_find_unused_parameters': None, 'ddp_bucket_cap_mb': None, 'ddp_broadcast_buffers': None, 'dataloader_pin_memory': True, 'dataloader_persistent_workers': False, 'skip_memory_metrics': True, 'use_legacy_prediction_loop': False, 'push_to_hub': False, 'resume_from_checkpoint': None, 'hub_model_id': None, 'hub_strategy': 'every_save', 'hub_token': '<HUB_TOKEN>', 'hub_private_repo': None, 'hub_always_push': False, 'hub_revision': None, 
'gradient_checkpointing': False, 'gradient_checkpointing_kwargs': None, 'include_inputs_for_metrics': False, 'include_for_metrics': [], 'eval_do_concat_batches': True, 'fp16_backend': 'auto', 'push_to_hub_model_id': None, 'push_to_hub_organization': None, 'push_to_hub_token': '<PUSH_TO_HUB_TOKEN>', 'mp_parameters': '', 'auto_find_batch_size': False, 'full_determinism': False, 'torchdynamo': None, 'ray_scope': 'last', 'ddp_timeout': 18000000, 'torch_compile': False, 'torch_compile_backend': None, 'torch_compile_mode': None, 'include_tokens_per_second': False, 'include_num_input_tokens_seen': 'no', 'neftune_noise_alpha': None, 'optim_target_modules': None, 'batch_eval_metrics': False, 'eval_on_start': False, 'use_liger_kernel': False, 'liger_kernel_config': None, 'eval_use_gather_object': False, 'average_tokens_across_devices': True, 'model_init_kwargs': None, 'disable_dropout': False, 'cast_lm_head_to_fp32': False, 'num_generations': 12, 'num_generations_eval': 4, 'max_completion_length': 256, 'ds3_gather_for_generation': True, 'shuffle_dataset': True, 'generation_batch_size': 48, 'steps_per_generation': 3, 'min_p': None, 'generation_kwargs': None, 'chat_template_kwargs': None, 'use_transformers_paged': False, 'cache_implementation': None, 'use_vllm': False, 'vllm_mode': None, 'vllm_model_impl': 'vllm', 'vllm_enable_sleep_mode': False, 'vllm_structured_outputs_regex': None, 'vllm_server_base_url': None, 'vllm_server_host': None, 'vllm_server_port': [8000], 'vllm_server_timeout': 240.0, 'vllm_group_port': 51216, 'vllm_gpu_memory_utilization': 0.9, 'vllm_max_model_length': None, 'vllm_tensor_parallel_size': 1, 'beta': 0.04, 'num_iterations': 2, 'epsilon': 0.2, 'delta': None, 'epsilon_high': 0.28, 'sapo_temperature_neg': 1.05, 'sapo_temperature_pos': 1.0, 'importance_sampling_level': 'token', 'reward_weights': None, 'multi_objective_aggregation': 'sum_then_normalize', 'scale_rewards': 'group', 'loss_type': 'dapo', 'mask_truncated_completions': False, 'sync_ref_model': 
False, 'ref_model_mixup_alpha': 0.6, 'ref_model_sync_steps': 512, 'top_entropy_quantile': 1.0, 'max_tool_calling_iterations': None, 'vllm_importance_sampling_correction': True, 'vllm_importance_sampling_mode': 'sequence_mask', 'vllm_importance_sampling_cap': 3.0, 'off_policy_mask_threshold': None, 'use_bias_correction_kl': False, 'log_completions': True, 'num_completions_to_print': None, 'log_unique_prompts': False, 'log_completions_hub_repo': None, 'tuner_backend': 'peft', 'vit_gradient_checkpointing': True, 'router_aux_loss_coef': 0.0, 'enable_dft_loss': False, 'enable_channel_loss': False, 'safe_serialization': True, 'max_shard_size': '5GB', 'check_model': True, 'acc_strategy': 'token', 'train_dataloader_shuffle': True, 'max_epochs': None, 'aligner_lr': None, 'vit_lr': None, 'use_logits_to_keep': None, 'resume_only_model': False, 'optimizer': None, 'eval_metric': None, 'callbacks': [], 'early_stop_interval': None, 'eval_use_evalscope': False, 'eval_dataset': [], 'eval_dataset_args': None, 'eval_limit': None, 'eval_generation_config': None, 'extra_eval_args': None, 'tuner_type': 'lora', 'use_galore': False, 'galore_target_modules': None, 'galore_rank': 128, 'galore_update_proj_gap': 50, 'galore_scale': 1.0, 'galore_proj_type': 'std', 'galore_optim_per_parameter': False, 'galore_with_embedding': False, 'galore_quantization': False, 'galore_proj_quant': False, 'galore_proj_bits': 4, 'galore_proj_group_size': 256, 'galore_cos_threshold': 0.4, 'galore_gamma_proj': 2, 'galore_queue_size': 5, 'lisa_activated_layers': 0, 'lisa_step_interval': 20, 'use_flash_ckpt': False, 'vllm_pipeline_parallel_size': 1, 'vllm_enable_expert_parallel': False, 'vllm_max_num_seqs': None, 'vllm_max_model_len': None, 'vllm_disable_custom_all_reduce': True, 'vllm_enforce_eager': False, 'vllm_limit_mm_per_prompt': None, 'vllm_max_lora_rank': 16, 'vllm_enable_prefix_caching': True, 'vllm_use_async_engine': None, 'vllm_quantization': None, 'vllm_reasoning_parser': None, 
'vllm_disable_cascade_attn': False, 'vllm_mm_processor_cache_gb': None, 'vllm_speculative_config': None, 'vllm_engine_kwargs': {}, 'vllm_data_parallel_size': 1, 'stop_words': [], 'vllm_enable_lora': False, 'lora_rank': 8, 'vllm_server_group_port': None, 'enable_flattened_weight_sync': True, 'async_generate': False, 'structured_outputs_regex': None, 'sleep_level': 0, 'move_model_batches': None, 'offload_optimizer': False, 'offload_model': False, 'wandb_log_unique_prompts': None, 'cosine_min_len_value_wrong': -0.5, 'cosine_max_len_value_wrong': 0.0, 'cosine_min_len_value_correct': 1.0, 'cosine_max_len_value_correct': 0.5, 'cosine_max_len': 256, 'repetition_n_grams': 3, 'repetition_max_penalty': -1.0, 'reward_model': None, 'reward_model_plugin': None, 'chord_sft_dataset': [], 'chord_sft_per_device_train_batch_size': None, 'chord_enable_phi_function': False, 'chord_mu_warmup_steps': None, 'chord_mu_decay_steps': None, 'chord_mu_peak': None, 'chord_mu_valley': None, 'multi_turn_scheduler': None, 'max_turns': None, 'completion_length_limit_scope': 'per_round', 'vllm_server_pass_dataset': False, 'dynamic_sample': True, 'max_resample_times': 4, 'overlong_filter': True, 'soft_max_length': None, 'soft_cache_length': None, 'log_entropy': False, 'tau_pos': 1.0, 'tau_neg': 1.05, 'advantage_estimator': 'grpo', 'kl_in_reward': False, 'dataset_shuffle': True, 'rollout_importance_sampling_mode': None, 'rollout_importance_sampling_threshold': 2.0, 'log_rollout_offpolicy_metrics': False, 'off_policy_sequence_mask_delta': None}
23
+ 2026-04-17 12:22:55,870 INFO MainThread:45975 [wandb_config.py:__setitem__():154] [no run ID] config set model/num_parameters = 2050307712 - <bound method Run._config_callback of <wandb.sdk.wandb_run.Run object at 0x7fe90873e920>>
24
+ 2026-04-17 12:22:55,870 INFO MainThread:45975 [wandb_run.py:_config_callback():1385] config_cb model/num_parameters 2050307712 None
25
+ 2026-04-17 12:22:57,706 INFO wandb-AsyncioManager-main:45975 [service_client.py:_forward_responses():80] Reached EOF.
26
+ 2026-04-17 12:22:57,707 INFO wandb-AsyncioManager-main:45975 [mailbox.py:close():137] Closing mailbox, abandoning 1 handles.
wandb/run-20260417_123237-3h84yfea/files/config.yaml ADDED
@@ -0,0 +1,1272 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ _name_or_path:
2
+ value: /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/qwen3-asr-merged
3
+ _wandb:
4
+ value:
5
+ cli_version: 0.23.0
6
+ e:
7
+ bpic2cpmtxvnwca2pu2tg19g1j2qwpb2:
8
+ args:
9
+ - --rlhf_type
10
+ - grpo
11
+ - --external_plugins
12
+ - /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/my_qwen3_asr_dapo_register.py
13
+ - /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/0417_reward.py
14
+ - --model
15
+ - /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/qwen3-asr-merged
16
+ - --model_type
17
+ - my_qwen3_asr_rl
18
+ - --template
19
+ - my_qwen3_asr_rl
20
+ - --dataset
21
+ - /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/lora_0323_10w+55w+error+syn_with_domain_train90_targeted_rl_train90_loramerged_basewer_3suppress_server.jsonl
22
+ - --val_dataset
23
+ - /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/lora_0323_10w+55w+error+syn_with_domain_train90_targeted_rl_val5_sample5p_server.jsonl
24
+ - --reward_funcs
25
+ - asr_wer_sub_len_cmp_hallu_dirty_v56
26
+ - --train_type
27
+ - lora
28
+ - --use_vllm
29
+ - "false"
30
+ - --log_completions
31
+ - "true"
32
+ - --loss_type
33
+ - dapo
34
+ - --advantage_estimator
35
+ - grpo
36
+ - --scale_rewards
37
+ - group
38
+ - --num_iterations
39
+ - "2"
40
+ - --beta
41
+ - "0.04"
42
+ - --epsilon_high
43
+ - "0.28"
44
+ - --dynamic_sample
45
+ - "true"
46
+ - --max_resample_times
47
+ - "4"
48
+ - --overlong_filter
49
+ - "true"
50
+ - --truncation_strategy
51
+ - delete
52
+ - --num_generations
53
+ - "12"
54
+ - --generation_batch_size
55
+ - "48"
56
+ - --per_device_train_batch_size
57
+ - "8"
58
+ - --per_device_eval_batch_size
59
+ - "8"
60
+ - --gradient_accumulation_steps
61
+ - "12"
62
+ - --num_generations_eval
63
+ - "4"
64
+ - --max_completion_length
65
+ - "256"
66
+ - --temperature
67
+ - "0.50"
68
+ - --top_p
69
+ - "0.95"
70
+ - --top_k
71
+ - "50"
72
+ - --repetition_penalty
73
+ - "1.08"
74
+ - --learning_rate
75
+ - "5e-5"
76
+ - --lr_scheduler_type
77
+ - cosine
78
+ - --warmup_ratio
79
+ - "0.03"
80
+ - --report_to
81
+ - wandb
82
+ - --run_name
83
+ - qwen3asr_dapo_reward56_4x4x12_12gen_4GPU
84
+ - --output_dir
85
+ - /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/out/qwen3asr_dapo_reward56_4x4x12_12gen_4GPU
86
+ - --save_strategy
87
+ - steps
88
+ - --save_steps
89
+ - "20"
90
+ - --logging_steps
91
+ - "5"
92
+ - --freeze_llm
93
+ - "false"
94
+ - --freeze_vit
95
+ - "false"
96
+ - --freeze_aligner
97
+ - "false"
98
+ - --remove_unused_columns
99
+ - "false"
100
+ - --padding_side
101
+ - left
102
+ cpu_count: 64
103
+ cpu_count_logical: 128
104
+ cudaVersion: "12.4"
105
+ disk:
106
+ /:
107
+ total: "524945911808"
108
+ used: "105544630272"
109
+ email: pang_kaiyu@163.com
110
+ executable: /mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/bin/python3.10
111
+ gpu: NVIDIA A100-SXM4-80GB
112
+ gpu_count: 8
113
+ gpu_nvidia:
114
+ - architecture: Ampere
115
+ cudaCores: 6912
116
+ memoryTotal: "85899345920"
117
+ name: NVIDIA A100-SXM4-80GB
118
+ uuid: GPU-51466de9-a668-3c7e-bb90-bb8c112e0fea
119
+ - architecture: Ampere
120
+ cudaCores: 6912
121
+ memoryTotal: "85899345920"
122
+ name: NVIDIA A100-SXM4-80GB
123
+ uuid: GPU-ec1a5f87-66dd-26c2-5656-b57c7015a595
124
+ - architecture: Ampere
125
+ cudaCores: 6912
126
+ memoryTotal: "85899345920"
127
+ name: NVIDIA A100-SXM4-80GB
128
+ uuid: GPU-2dabb104-8ec6-09ec-017a-204779e18c19
129
+ - architecture: Ampere
130
+ cudaCores: 6912
131
+ memoryTotal: "85899345920"
132
+ name: NVIDIA A100-SXM4-80GB
133
+ uuid: GPU-0e67540a-1930-f39b-320f-0a6bfe1da2e0
134
+ - architecture: Ampere
135
+ cudaCores: 6912
136
+ memoryTotal: "85899345920"
137
+ name: NVIDIA A100-SXM4-80GB
138
+ uuid: GPU-b46e583c-5ac8-e350-6045-49ad7b17c092
139
+ - architecture: Ampere
140
+ cudaCores: 6912
141
+ memoryTotal: "85899345920"
142
+ name: NVIDIA A100-SXM4-80GB
143
+ uuid: GPU-f293d16a-41a0-fbc1-e86c-4f9682cb5e2b
144
+ - architecture: Ampere
145
+ cudaCores: 6912
146
+ memoryTotal: "85899345920"
147
+ name: NVIDIA A100-SXM4-80GB
148
+ uuid: GPU-67958330-9199-dca8-5c2e-c665b13b3452
149
+ - architecture: Ampere
150
+ cudaCores: 6912
151
+ memoryTotal: "85899345920"
152
+ name: NVIDIA A100-SXM4-80GB
153
+ uuid: GPU-6b56602f-4dcf-cb9d-4e98-04bf6254b789
154
+ host: SH-IDC1-10-140-37-1
155
+ memory:
156
+ total: "1081627828224"
157
+ os: Linux-3.10.0-957.el7.x86_64-x86_64-with-glibc2.17
158
+ program: /mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/cli/rlhf.py
159
+ python: CPython 3.10.18
160
+ root: /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload
161
+ slurm:
162
+ cluster_name: cluster_sproject3
163
+ conf: /etc/slurm/slurm.conf
164
+ cpus_on_node: "2"
165
+ gtids: "0"
166
+ job_account: research
167
+ job_cpus_per_node: "2"
168
+ job_gid: "800000689"
169
+ job_id: "8568802"
170
+ job_name: qwen_debug
171
+ job_nodelist: SH-IDC1-10-140-37-1
172
+ job_num_nodes: "1"
173
+ job_partition: interntmp
174
+ job_qos: normal
175
+ job_uid: "800000689"
176
+ job_user: panjiabao
177
+ jobid: "8568802"
178
+ launch_node_ipaddr: 10.140.37.164
179
+ localid: "0"
180
+ nnodes: "1"
181
+ nodeid: "0"
182
+ nodelist: SH-IDC1-10-140-37-1
183
+ nprocs: "1"
184
+ ntasks: "1"
185
+ prio_process: "0"
186
+ procid: "0"
187
+ srun_comm_host: 10.140.37.164
188
+ srun_comm_port: "44570"
189
+ step_gpus: 4,5
190
+ step_id: "0"
191
+ step_launcher_port: "44570"
192
+ step_nodelist: SH-IDC1-10-140-37-1
193
+ step_num_nodes: "1"
194
+ step_num_tasks: "1"
195
+ step_tasks_per_node: "1"
196
+ stepid: "0"
197
+ submit_dir: /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload
198
+ submit_host: SH-IDC1-10-140-37-164
199
+ task_pid: "24357"
200
+ tasks_per_node: "1"
201
+ topology_addr: SH-IDC1-10-140-37-1
202
+ topology_addr_pattern: node
203
+ umask: "0002"
204
+ working_cluster: cluster_sproject3:SH-IDC1-10-140-37-161:6817:9216:109
205
+ startedAt: "2026-04-17T04:32:37.414555Z"
206
+ writerId: bpic2cpmtxvnwca2pu2tg19g1j2qwpb2
207
+ m:
208
+ - "1": train/global_step
209
+ "6":
210
+ - 3
211
+ "7": []
212
+ - "2": '*'
213
+ "5": 1
214
+ "6":
215
+ - 1
216
+ "7": []
217
+ python_version: 3.10.18
218
+ t:
219
+ "1":
220
+ - 1
221
+ - 5
222
+ - 11
223
+ - 30
224
+ - 41
225
+ - 49
226
+ - 51
227
+ - 53
228
+ - 71
229
+ - 84
230
+ - 95
231
+ - 98
232
+ - 105
233
+ "2":
234
+ - 1
235
+ - 5
236
+ - 11
237
+ - 30
238
+ - 41
239
+ - 49
240
+ - 51
241
+ - 53
242
+ - 71
243
+ - 84
244
+ - 95
245
+ - 98
246
+ - 105
247
+ "3":
248
+ - 7
249
+ - 13
250
+ - 19
251
+ - 66
252
+ "4": 3.10.18
253
+ "5": 0.23.0
254
+ "6": 4.57.6
255
+ "9":
256
+ "1": transformers_trainer
257
+ "12": 0.23.0
258
+ "13": linux-x86_64
259
+ acc_strategy:
260
+ value: token
261
+ accelerator_config:
262
+ value:
263
+ dispatch_batches: false
264
+ even_batches: true
265
+ gradient_accumulation_kwargs: null
266
+ non_blocking: false
267
+ split_batches: false
268
+ use_seedable_sampler: true
269
+ adafactor:
270
+ value: false
271
+ adam_beta1:
272
+ value: 0.9
273
+ adam_beta2:
274
+ value: 0.95
275
+ adam_epsilon:
276
+ value: 1e-08
277
+ add_cross_attention:
278
+ value: false
279
+ advantage_estimator:
280
+ value: grpo
281
+ aligner_lr:
282
+ value: null
283
+ architectures:
284
+ value:
285
+ - Qwen3ASRForConditionalGeneration
286
+ async_generate:
287
+ value: false
288
+ auto_find_batch_size:
289
+ value: false
290
+ average_tokens_across_devices:
291
+ value: true
292
+ bad_words_ids:
293
+ value: null
294
+ batch_eval_metrics:
295
+ value: false
296
+ begin_suppress_tokens:
297
+ value: null
298
+ beta:
299
+ value: 0.04
300
+ bf16:
301
+ value: true
302
+ bf16_full_eval:
303
+ value: false
304
+ bos_token_id:
305
+ value: null
306
+ cache_implementation:
307
+ value: null
308
+ callbacks:
309
+ value: []
310
+ cast_lm_head_to_fp32:
311
+ value: false
312
+ chat_template_kwargs:
313
+ value: null
314
+ check_model:
315
+ value: true
316
+ chord_enable_phi_function:
317
+ value: false
318
+ chord_mu_decay_steps:
319
+ value: null
320
+ chord_mu_peak:
321
+ value: null
322
+ chord_mu_valley:
323
+ value: null
324
+ chord_mu_warmup_steps:
325
+ value: null
326
+ chord_sft_dataset:
327
+ value: []
328
+ chord_sft_per_device_train_batch_size:
329
+ value: null
330
+ chunk_size_feed_forward:
331
+ value: 0
332
+ completion_length_limit_scope:
333
+ value: per_round
334
+ cosine_max_len:
335
+ value: 256
336
+ cosine_max_len_value_correct:
337
+ value: 0.5
338
+ cosine_max_len_value_wrong:
339
+ value: 0
340
+ cosine_min_len_value_correct:
341
+ value: 1
342
+ cosine_min_len_value_wrong:
343
+ value: -0.5
344
+ cross_attention_hidden_size:
345
+ value: null
346
+ data_seed:
347
+ value: 42
348
+ dataloader_drop_last:
349
+ value: true
350
+ dataloader_num_workers:
351
+ value: 1
352
+ dataloader_persistent_workers:
353
+ value: false
354
+ dataloader_pin_memory:
355
+ value: true
356
+ dataloader_prefetch_factor:
357
+ value: 2
358
+ dataset_shuffle:
359
+ value: true
360
+ ddp_backend:
361
+ value: null
362
+ ddp_broadcast_buffers:
363
+ value: null
364
+ ddp_bucket_cap_mb:
365
+ value: null
366
+ ddp_find_unused_parameters:
367
+ value: null
368
+ ddp_timeout:
369
+ value: 18000000
370
+ debug:
371
+ value: []
372
+ decoder_start_token_id:
373
+ value: null
374
+ deepspeed:
375
+ value: null
376
+ delta:
377
+ value: null
378
+ disable_dropout:
379
+ value: false
380
+ disable_tqdm:
381
+ value: false
382
+ diversity_penalty:
383
+ value: 0
384
+ do_eval:
385
+ value: true
386
+ do_predict:
387
+ value: false
388
+ do_sample:
389
+ value: false
390
+ do_train:
391
+ value: false
392
+ ds3_gather_for_generation:
393
+ value: true
394
+ dtype:
395
+ value: bfloat16
396
+ dynamic_sample:
397
+ value: true
398
+ early_stop_interval:
399
+ value: null
400
+ early_stopping:
401
+ value: false
402
+ enable_channel_loss:
403
+ value: false
404
+ enable_dft_loss:
405
+ value: false
406
+ enable_flattened_weight_sync:
407
+ value: true
408
+ encoder_no_repeat_ngram_size:
409
+ value: 0
410
+ eos_token_id:
411
+ value: 151645
412
+ epsilon:
413
+ value: 0.2
414
+ epsilon_high:
415
+ value: 0.28
416
+ eval_accumulation_steps:
417
+ value: null
418
+ eval_dataset:
419
+ value: []
420
+ eval_dataset_args:
421
+ value: null
422
+ eval_delay:
423
+ value: 0
424
+ eval_do_concat_batches:
425
+ value: true
426
+ eval_generation_config:
427
+ value: null
428
+ eval_limit:
429
+ value: null
430
+ eval_metric:
431
+ value: null
432
+ eval_on_start:
433
+ value: false
434
+ eval_steps:
435
+ value: 20
436
+ eval_strategy:
437
+ value: steps
438
+ eval_use_evalscope:
439
+ value: false
440
+ eval_use_gather_object:
441
+ value: false
442
+ exponential_decay_length_penalty:
443
+ value: null
444
+ extra_eval_args:
445
+ value: null
446
+ finetuning_task:
447
+ value: null
448
+ forced_bos_token_id:
449
+ value: null
450
+ forced_eos_token_id:
451
+ value: null
452
+ fp16:
453
+ value: false
454
+ fp16_backend:
455
+ value: auto
456
+ fp16_full_eval:
457
+ value: false
458
+ fp16_opt_level:
459
+ value: O1
460
+ fsdp:
461
+ value: []
462
+ fsdp_config:
463
+ value:
464
+ min_num_params: 0
465
+ xla: false
466
+ xla_fsdp_grad_ckpt: false
467
+ xla_fsdp_v2: false
468
+ fsdp_min_num_params:
469
+ value: 0
470
+ fsdp_transformer_layer_cls_to_wrap:
471
+ value: null
472
+ full_determinism:
473
+ value: false
474
+ galore_cos_threshold:
475
+ value: 0.4
476
+ galore_gamma_proj:
477
+ value: 2
478
+ galore_optim_per_parameter:
479
+ value: false
480
+ galore_proj_bits:
481
+ value: 4
482
+ galore_proj_group_size:
483
+ value: 256
484
+ galore_proj_quant:
485
+ value: false
486
+ galore_proj_type:
487
+ value: std
488
+ galore_quantization:
489
+ value: false
490
+ galore_queue_size:
491
+ value: 5
492
+ galore_rank:
493
+ value: 128
494
+ galore_scale:
495
+ value: 1
496
+ galore_target_modules:
497
+ value: null
498
+ galore_update_proj_gap:
499
+ value: 50
500
+ galore_with_embedding:
501
+ value: false
502
+ generation_batch_size:
503
+ value: 48
504
+ generation_kwargs:
505
+ value: null
506
+ gradient_accumulation_steps:
507
+ value: 12
508
+ gradient_checkpointing:
509
+ value: false
510
+ gradient_checkpointing_kwargs:
511
+ value: null
512
+ greater_is_better:
513
+ value: false
514
+ group_by_length:
515
+ value: false
516
+ half_precision_backend:
517
+ value: auto
518
+ hub_always_push:
519
+ value: false
520
+ hub_model_id:
521
+ value: null
522
+ hub_private_repo:
523
+ value: null
524
+ hub_revision:
525
+ value: null
526
+ hub_strategy:
527
+ value: every_save
528
+ hub_token:
529
+ value: <HUB_TOKEN>
530
+ id2label:
531
+ value:
532
+ "0": LABEL_0
533
+ "1": LABEL_1
534
+ ignore_data_skip:
535
+ value: false
536
+ importance_sampling_level:
537
+ value: token
538
+ include_for_metrics:
539
+ value: []
540
+ include_inputs_for_metrics:
541
+ value: false
542
+ include_num_input_tokens_seen:
543
+ value: "no"
544
+ include_tokens_per_second:
545
+ value: false
546
+ is_decoder:
547
+ value: false
548
+ is_encoder_decoder:
549
+ value: false
550
+ jit_mode_eval:
551
+ value: false
552
+ kl_in_reward:
553
+ value: false
554
+ label_names:
555
+ value: null
556
+ label_smoothing_factor:
557
+ value: 0
558
+ label2id:
559
+ value:
560
+ LABEL_0: 0
561
+ LABEL_1: 1
562
+ learning_rate:
563
+ value: 5e-05
564
+ length_column_name:
565
+ value: length
566
+ length_penalty:
567
+ value: 1
568
+ liger_kernel_config:
569
+ value: null
570
+ lisa_activated_layers:
571
+ value: 0
572
+ lisa_step_interval:
573
+ value: 20
574
+ load_best_model_at_end:
575
+ value: false
576
+ local_rank:
577
+ value: 0
578
+ log_completions:
579
+ value: true
580
+ log_completions_hub_repo:
581
+ value: null
582
+ log_entropy:
583
+ value: false
584
+ log_level:
585
+ value: passive
586
+ log_level_replica:
587
+ value: warning
588
+ log_on_each_node:
589
+ value: true
590
+ log_rollout_offpolicy_metrics:
591
+ value: false
592
+ log_unique_prompts:
593
+ value: false
594
+ logging_dir:
595
+ value: /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/out/qwen3asr_dapo_reward56_4x4x12_12gen_4GPU/v3-20260417-123227/runs
596
+ logging_first_step:
597
+ value: true
598
+ logging_nan_inf_filter:
599
+ value: true
600
+ logging_steps:
601
+ value: 5
602
+ logging_strategy:
603
+ value: steps
604
+ lora_rank:
605
+ value: 8
606
+ loss_type:
607
+ value: dapo
608
+ lr_scheduler_kwargs:
609
+ value: null
610
+ lr_scheduler_type:
611
+ value: cosine
612
+ mask_truncated_completions:
613
+ value: false
614
+ max_completion_length:
615
+ value: 256
616
+ max_epochs:
617
+ value: null
618
+ max_grad_norm:
619
+ value: 1
620
+ max_length:
621
+ value: 20
622
+ max_resample_times:
623
+ value: 4
624
+ max_shard_size:
625
+ value: 5GB
626
+ max_steps:
627
+ value: -1
628
+ max_tool_calling_iterations:
629
+ value: null
630
+ max_turns:
631
+ value: null
632
+ metric_for_best_model:
633
+ value: loss
634
+ min_length:
635
+ value: 0
636
+ min_p:
637
+ value: null
638
+ model/num_parameters:
639
+ value: 2050307712
640
+ model_init_kwargs:
641
+ value: null
642
+ model_type:
643
+ value: qwen3_asr
644
+ move_model_batches:
645
+ value: null
646
+ mp_parameters:
647
+ value: ""
648
+ multi_objective_aggregation:
649
+ value: sum_then_normalize
650
+ multi_turn_scheduler:
651
+ value: null
652
+ neftune_noise_alpha:
653
+ value: null
654
+ no_cuda:
655
+ value: false
656
+ no_repeat_ngram_size:
657
+ value: 0
658
+ num_beam_groups:
659
+ value: 1
660
+ num_beams:
661
+ value: 1
662
+ num_completions_to_print:
663
+ value: null
664
+ num_generations:
665
+ value: 12
666
+ num_generations_eval:
667
+ value: 4
668
+ num_iterations:
669
+ value: 2
670
+ num_return_sequences:
671
+ value: 1
672
+ num_train_epochs:
673
+ value: 3
674
+ off_policy_mask_threshold:
675
+ value: null
676
+ off_policy_sequence_mask_delta:
677
+ value: null
678
+ offload_model:
679
+ value: false
680
+ offload_optimizer:
681
+ value: false
682
+ optim:
683
+ value: adamw_torch
684
+ optim_args:
685
+ value: null
686
+ optim_target_modules:
687
+ value: null
688
+ optimizer:
689
+ value: null
690
+ output_attentions:
691
+ value: false
692
+ output_dir:
693
+ value: /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/out/qwen3asr_dapo_reward56_4x4x12_12gen_4GPU/v3-20260417-123227
694
+ output_hidden_states:
695
+ value: false
696
+ output_scores:
697
+ value: false
698
+ overlong_filter:
699
+ value: true
700
+ overwrite_output_dir:
701
+ value: false
702
+ pad_token_id:
703
+ value: 151643
704
+ parallelism_config:
705
+ value: null
706
+ past_index:
707
+ value: -1
708
+ peft_config:
709
+ value:
710
+ default:
711
+ alora_invocation_tokens: null
712
+ arrow_config: null
713
+ auto_mapping: null
714
+ base_model_name_or_path: /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/qwen3-asr-merged
715
+ bias: none
716
+ corda_config: null
717
+ ensure_weight_tying: false
718
+ eva_config: null
719
+ exclude_modules: null
720
+ fan_in_fan_out: false
721
+ inference_mode: false
722
+ init_lora_weights: true
723
+ layer_replication: null
724
+ layers_pattern: null
725
+ layers_to_transform: null
726
+ lora_alpha: 32
727
+ lora_bias: false
728
+ lora_dropout: 0.05
729
+ lora_dtype: null
730
+ lorap_emb_lr: 1e-06
731
+ lorap_lr_ratio: null
732
+ megatron_config: null
733
+ megatron_core: megatron.core
734
+ modules_to_save: []
735
+ peft_type: LORA
736
+ peft_version: 0.18.1
737
+ qalora_group_size: 16
738
+ r: 8
739
+ revision: null
740
+ runtime_config:
741
+ ephemeral_gpu_offload: false
742
+ target_modules: ^(thinker\.model(?=\.).*\.(up_proj|v_proj|k_proj|o_proj|q_proj|gate_proj|down_proj)|thinker\.audio_tower\.layers(?=\.).*\.(v_proj|fc2|k_proj|fc1|q_proj|out_proj)|thinker\.audio_tower\.conv_out(?=\.)|thinker\.audio_tower\.proj1(?=\.)|thinker\.audio_tower\.proj2(?=\.))$
743
+ target_parameters: null
744
+ task_type: CAUSAL_LM
745
+ trainable_token_indices: null
746
+ use_dora: false
747
+ use_qalora: false
748
+ use_rslora: false
749
+ per_device_eval_batch_size:
750
+ value: 8
751
+ per_device_train_batch_size:
752
+ value: 8
753
+ per_gpu_eval_batch_size:
754
+ value: null
755
+ per_gpu_train_batch_size:
756
+ value: null
757
+ prediction_loss_only:
758
+ value: false
759
+ prefix:
760
+ value: null
761
+ problem_type:
762
+ value: null
763
+ project:
764
+ value: huggingface
765
+ push_to_hub:
766
+ value: false
767
+ push_to_hub_model_id:
768
+ value: null
769
+ push_to_hub_organization:
770
+ value: null
771
+ push_to_hub_token:
772
+ value: <PUSH_TO_HUB_TOKEN>
773
+ ray_scope:
774
+ value: last
775
+ ref_model_mixup_alpha:
776
+ value: 0.6
777
+ ref_model_sync_steps:
778
+ value: 512
779
+ remove_invalid_values:
780
+ value: false
781
+ remove_unused_columns:
782
+ value: false
783
+ repetition_max_penalty:
784
+ value: -1
785
+ repetition_n_grams:
786
+ value: 3
787
+ repetition_penalty:
788
+ value: 1.08
789
+ report_to:
790
+ value:
791
+ - wandb
792
+ restore_callback_states_from_checkpoint:
793
+ value: false
794
+ resume_from_checkpoint:
795
+ value: null
796
+ resume_only_model:
797
+ value: false
798
+ return_dict:
799
+ value: true
800
+ return_dict_in_generate:
801
+ value: false
802
+ reward_model:
803
+ value: null
804
+ reward_model_plugin:
805
+ value: null
806
+ reward_weights:
807
+ value: null
808
+ rollout_importance_sampling_mode:
809
+ value: null
810
+ rollout_importance_sampling_threshold:
811
+ value: 2
812
+ router_aux_loss_coef:
813
+ value: 0
814
+ run_name:
815
+ value: qwen3asr_dapo_reward56_4x4x12_12gen_4GPU
816
+ safe_serialization:
817
+ value: true
818
+ sapo_temperature_neg:
819
+ value: 1.05
820
+ sapo_temperature_pos:
821
+ value: 1
822
+ save_on_each_node:
823
+ value: false
824
+ save_only_model:
825
+ value: false
826
+ save_safetensors:
827
+ value: true
828
+ save_steps:
829
+ value: 20
830
+ save_strategy:
831
+ value: steps
832
+ save_total_limit:
833
+ value: null
834
+ scale_rewards:
835
+ value: group
836
+ seed:
837
+ value: 42
838
+ sep_token_id:
839
+ value: null
840
+ shuffle_dataset:
841
+ value: true
842
+ skip_memory_metrics:
843
+ value: true
844
+ sleep_level:
845
+ value: 0
846
+ soft_cache_length:
847
+ value: null
848
+ soft_max_length:
849
+ value: null
850
+ steps_per_generation:
851
+ value: 3
852
+ stop_words:
853
+ value: []
854
+ structured_outputs_regex:
855
+ value: null
856
+ support_languages:
857
+ value:
858
+ - Chinese
859
+ - English
860
+ - Cantonese
861
+ - Arabic
862
+ - German
863
+ - French
864
+ - Spanish
865
+ - Portuguese
866
+ - Indonesian
867
+ - Italian
868
+ - Korean
869
+ - Russian
870
+ - Thai
871
+ - Vietnamese
872
+ - Japanese
873
+ - Turkish
874
+ - Hindi
875
+ - Malay
876
+ - Dutch
877
+ - Swedish
878
+ - Danish
879
+ - Finnish
880
+ - Polish
881
+ - Czech
882
+ - Filipino
883
+ - Persian
884
+ - Greek
885
+ - Romanian
886
+ - Hungarian
887
+ - Macedonian
888
+ suppress_tokens:
889
+ value: null
890
+ sync_ref_model:
891
+ value: false
892
+ task_specific_params:
893
+ value: null
894
+ tau_neg:
895
+ value: 1.05
896
+ tau_pos:
897
+ value: 1
898
+ temperature:
899
+ value: 0.5
900
+ tf_legacy_loss:
901
+ value: false
902
+ tf32:
903
+ value: null
904
+ thinker_config:
905
+ value:
906
+ _name_or_path: ""
907
+ add_cross_attention: false
908
+ architectures:
909
+ - Qwen3ASRForConditionalGeneration
910
+ audio_config:
911
+ _name_or_path: ""
912
+ activation_dropout: 0
913
+ activation_function: gelu
914
+ add_cross_attention: false
915
+ architectures: null
916
+ attention_dropout: 0
917
+ bad_words_ids: null
918
+ begin_suppress_tokens: null
919
+ bos_token_id: null
920
+ chunk_size_feed_forward: 0
921
+ conv_chunksize: 500
922
+ cross_attention_hidden_size: null
923
+ d_model: 1024
924
+ decoder_start_token_id: null
925
+ diversity_penalty: 0
926
+ do_sample: false
927
+ downsample_hidden_size: 480
928
+ dropout: 0
929
+ dtype: null
930
+ early_stopping: false
931
+ encoder_attention_heads: 16
932
+ encoder_ffn_dim: 4096
933
+ encoder_layers: 24
934
+ encoder_no_repeat_ngram_size: 0
935
+ eos_token_id: null
936
+ exponential_decay_length_penalty: null
937
+ finetuning_task: null
938
+ forced_bos_token_id: null
939
+ forced_eos_token_id: null
940
+ id2label:
941
+ "0": LABEL_0
942
+ "1": LABEL_1
943
+ initializer_range: 0.02
944
+ is_decoder: false
945
+ is_encoder_decoder: false
946
+ label2id:
947
+ LABEL_0: 0
948
+ LABEL_1: 1
949
+ length_penalty: 1
950
+ max_length: 20
951
+ max_source_positions: 1500
952
+ min_length: 0
953
+ model_type: qwen3_asr_audio_encoder
954
+ n_window: 50
955
+ n_window_infer: 800
956
+ no_repeat_ngram_size: 0
957
+ num_beam_groups: 1
958
+ num_beams: 1
959
+ num_hidden_layers: 24
960
+ num_mel_bins: 128
961
+ num_return_sequences: 1
962
+ output_attentions: false
963
+ output_dim: 2048
964
+ output_hidden_states: false
965
+ output_scores: false
966
+ pad_token_id: null
967
+ prefix: null
968
+ problem_type: null
969
+ remove_invalid_values: false
970
+ repetition_penalty: 1
971
+ return_dict: true
972
+ return_dict_in_generate: false
973
+ scale_embedding: false
974
+ sep_token_id: null
975
+ suppress_tokens: null
976
+ task_specific_params: null
977
+ temperature: 1
978
+ tf_legacy_loss: false
979
+ tie_encoder_decoder: false
980
+ tie_word_embeddings: true
981
+ tokenizer_class: null
982
+ top_k: 50
983
+ top_p: 1
984
+ torchscript: false
985
+ typical_p: 1
986
+ use_bfloat16: false
987
+ audio_end_token_id: 151670
988
+ audio_start_token_id: 151669
989
+ audio_token_id: 151676
990
+ bad_words_ids: null
991
+ begin_suppress_tokens: null
992
+ bos_token_id: null
993
+ chunk_size_feed_forward: 0
994
+ cross_attention_hidden_size: null
995
+ decoder_start_token_id: null
996
+ diversity_penalty: 0
997
+ do_sample: false
998
+ dtype: bfloat16
999
+ early_stopping: false
1000
+ encoder_no_repeat_ngram_size: 0
1001
+ eos_token_id: null
1002
+ exponential_decay_length_penalty: null
1003
+ finetuning_task: null
1004
+ forced_bos_token_id: null
1005
+ forced_eos_token_id: null
1006
+ id2label:
1007
+ "0": LABEL_0
1008
+ "1": LABEL_1
1009
+ initializer_range: 0.02
1010
+ is_decoder: false
1011
+ is_encoder_decoder: false
1012
+ label2id:
1013
+ LABEL_0: 0
1014
+ LABEL_1: 1
1015
+ length_penalty: 1
1016
+ max_length: 20
1017
+ min_length: 0
1018
+ model_type: qwen3_asr_thinker
1019
+ no_repeat_ngram_size: 0
1020
+ num_beam_groups: 1
1021
+ num_beams: 1
1022
+ num_return_sequences: 1
1023
+ output_attentions: false
1024
+ output_hidden_states: false
1025
+ output_scores: false
1026
+ pad_token_id: null
1027
+ prefix: null
1028
+ problem_type: null
1029
+ remove_invalid_values: false
1030
+ repetition_penalty: 1
1031
+ return_dict: true
1032
+ return_dict_in_generate: false
1033
+ sep_token_id: null
1034
+ suppress_tokens: null
1035
+ task_specific_params: null
1036
+ temperature: 1
1037
+ text_config:
1038
+ _name_or_path: ""
1039
+ add_cross_attention: false
1040
+ architectures: null
1041
+ attention_bias: false
1042
+ attention_dropout: 0
1043
+ bad_words_ids: null
1044
+ begin_suppress_tokens: null
1045
+ bos_token_id: null
1046
+ chunk_size_feed_forward: 0
1047
+ cross_attention_hidden_size: null
1048
+ decoder_start_token_id: null
1049
+ diversity_penalty: 0
1050
+ do_sample: false
1051
+ dtype: null
1052
+ early_stopping: false
1053
+ encoder_no_repeat_ngram_size: 0
1054
+ eos_token_id: null
1055
+ exponential_decay_length_penalty: null
1056
+ finetuning_task: null
1057
+ forced_bos_token_id: null
1058
+ forced_eos_token_id: null
1059
+ head_dim: 128
1060
+ hidden_act: silu
1061
+ hidden_size: 2048
1062
+ id2label:
1063
+ "0": LABEL_0
1064
+ "1": LABEL_1
1065
+ initializer_range: 0.02
1066
+ intermediate_size: 6144
1067
+ is_decoder: false
1068
+ is_encoder_decoder: false
1069
+ label2id:
1070
+ LABEL_0: 0
1071
+ LABEL_1: 1
1072
+ length_penalty: 1
1073
+ max_length: 20
1074
+ max_position_embeddings: 65536
1075
+ min_length: 0
1076
+ model_type: qwen3_asr_text
1077
+ no_repeat_ngram_size: 0
1078
+ num_attention_heads: 16
1079
+ num_beam_groups: 1
1080
+ num_beams: 1
1081
+ num_hidden_layers: 28
1082
+ num_key_value_heads: 8
1083
+ num_return_sequences: 1
1084
+ output_attentions: false
1085
+ output_hidden_states: false
1086
+ output_scores: false
1087
+ pad_token_id: 151643
1088
+ prefix: null
1089
+ problem_type: null
1090
+ remove_invalid_values: false
1091
+ repetition_penalty: 1
1092
+ return_dict: true
1093
+ return_dict_in_generate: false
1094
+ rms_norm_eps: 1e-06
1095
+ rope_scaling:
1096
+ interleaved: true
1097
+ mrope_interleaved: true
1098
+ mrope_section:
1099
+ - 24
1100
+ - 20
1101
+ - 20
1102
+ rope_type: default
1103
+ type: default
1104
+ rope_theta: 1000000
1105
+ sep_token_id: null
1106
+ suppress_tokens: null
1107
+ task_specific_params: null
1108
+ temperature: 1
1109
+ tf_legacy_loss: false
1110
+ tie_encoder_decoder: false
1111
+ tie_word_embeddings: true
1112
+ tokenizer_class: null
1113
+ top_k: 50
1114
+ top_p: 1
1115
+ torchscript: false
1116
+ typical_p: 1
1117
+ use_bfloat16: false
1118
+ use_cache: false
1119
+ vocab_size: 151936
1120
+ tf_legacy_loss: false
1121
+ tie_encoder_decoder: false
1122
+ tie_word_embeddings: true
1123
+ tokenizer_class: null
1124
+ top_k: 50
1125
+ top_p: 1
1126
+ torchscript: false
1127
+ typical_p: 1
1128
+ use_bfloat16: false
1129
+ user_token_id: 872
1130
+ tie_encoder_decoder:
1131
+ value: false
1132
+ tie_word_embeddings:
1133
+ value: true
1134
+ tokenizer_class:
1135
+ value: null
1136
+ top_entropy_quantile:
1137
+ value: 1
1138
+ top_k:
1139
+ value: 50
1140
+ top_p:
1141
+ value: 0.95
1142
+ torch_compile:
1143
+ value: false
1144
+ torch_compile_backend:
1145
+ value: null
1146
+ torch_compile_mode:
1147
+ value: null
1148
+ torch_empty_cache_steps:
1149
+ value: null
1150
+ torchdynamo:
1151
+ value: null
1152
+ torchscript:
1153
+ value: false
1154
+ tpu_metrics_debug:
1155
+ value: false
1156
+ tpu_num_cores:
1157
+ value: null
1158
+ trackio_space_id:
1159
+ value: trackio
1160
+ train_dataloader_shuffle:
1161
+ value: true
1162
+ transformers_version:
1163
+ value: 4.57.6
1164
+ tuner_backend:
1165
+ value: peft
1166
+ tuner_type:
1167
+ value: lora
1168
+ typical_p:
1169
+ value: 1
1170
+ use_bfloat16:
1171
+ value: false
1172
+ use_bias_correction_kl:
1173
+ value: false
1174
+ use_cpu:
1175
+ value: false
1176
+ use_flash_ckpt:
1177
+ value: false
1178
+ use_galore:
1179
+ value: false
1180
+ use_legacy_prediction_loop:
1181
+ value: false
1182
+ use_liger_kernel:
1183
+ value: false
1184
+ use_logits_to_keep:
1185
+ value: null
1186
+ use_mps_device:
1187
+ value: false
1188
+ use_transformers_paged:
1189
+ value: false
1190
+ use_vllm:
1191
+ value: false
1192
+ vit_gradient_checkpointing:
1193
+ value: true
1194
+ vit_lr:
1195
+ value: null
1196
+ vllm_data_parallel_size:
1197
+ value: 1
1198
+ vllm_disable_cascade_attn:
1199
+ value: false
1200
+ vllm_disable_custom_all_reduce:
1201
+ value: true
1202
+ vllm_enable_expert_parallel:
1203
+ value: false
1204
+ vllm_enable_lora:
1205
+ value: false
1206
+ vllm_enable_prefix_caching:
1207
+ value: true
1208
+ vllm_enable_sleep_mode:
1209
+ value: false
1210
+ vllm_enforce_eager:
1211
+ value: false
1212
+ vllm_gpu_memory_utilization:
1213
+ value: 0.9
1214
+ vllm_group_port:
1215
+ value: 51216
1216
+ vllm_importance_sampling_cap:
1217
+ value: 3
1218
+ vllm_importance_sampling_correction:
1219
+ value: true
1220
+ vllm_importance_sampling_mode:
1221
+ value: sequence_mask
1222
+ vllm_limit_mm_per_prompt:
1223
+ value: null
1224
+ vllm_max_lora_rank:
1225
+ value: 16
1226
+ vllm_max_model_len:
1227
+ value: null
1228
+ vllm_max_model_length:
1229
+ value: null
1230
+ vllm_max_num_seqs:
1231
+ value: null
1232
+ vllm_mm_processor_cache_gb:
1233
+ value: null
1234
+ vllm_mode:
1235
+ value: null
1236
+ vllm_model_impl:
1237
+ value: vllm
1238
+ vllm_pipeline_parallel_size:
1239
+ value: 1
1240
+ vllm_quantization:
1241
+ value: null
1242
+ vllm_reasoning_parser:
1243
+ value: null
1244
+ vllm_server_base_url:
1245
+ value: null
1246
+ vllm_server_group_port:
1247
+ value: null
1248
+ vllm_server_host:
1249
+ value: null
1250
+ vllm_server_pass_dataset:
1251
+ value: false
1252
+ vllm_server_port:
1253
+ value:
1254
+ - 8000
1255
+ vllm_server_timeout:
1256
+ value: 240
1257
+ vllm_speculative_config:
1258
+ value: null
1259
+ vllm_structured_outputs_regex:
1260
+ value: null
1261
+ vllm_tensor_parallel_size:
1262
+ value: 1
1263
+ vllm_use_async_engine:
1264
+ value: null
1265
+ wandb_log_unique_prompts:
1266
+ value: null
1267
+ warmup_ratio:
1268
+ value: 0.03
1269
+ warmup_steps:
1270
+ value: 0
1271
+ weight_decay:
1272
+ value: 0.1
wandb/run-20260417_123237-3h84yfea/files/media/table/completions_1_e5129c1db5b8522d8aa7.table.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"columns": ["step", "prompt", "completion", "ASRWerSubLenCmpHalluDirtyV56", "advantages", "solution"], "data": [["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The reverend recteur passed his hand wearily over his brow, a hill with a faint memory of running upstairs so quickly. We never touched the beastly box. The doctor then your competitor did said missus nelly no no said the curate hastily.<|im_end|>", -0.1968451738357544, -0.8322931528091431, "The reverend septimus passed his hand wearily over his brow. I feel a little faint, he said, running upstairs so quickly, we never touched the beastly box, said robert. Then your confederates did said miss selina. No, no, said the curate hastily."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The reverend rectory passed his hand wearily over his brow a hill and a faint misty morning upstairs, he said we never touched the beastly box then your competitor did said missus nixon no no said the curate hastily.<|im_end|>", -0.37275323271751404, -2.000243663787842, "The reverend septimus passed his hand wearily over his brow. I feel a little faint, he said, running upstairs so quickly, we never touched the beastly box, said robert. Then your confederates did said miss selina. No, no, said the curate hastily."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The reverend recteur passed his hand wearily over his brow a hill wind of faintness has been running upstairs so lately, we never touched the beastly box said the vicar then your competitor did said missus neil no no said the curate hastily.<|im_end|>", -0.174954354763031, -0.6869479417800903, "The reverend septimus passed his hand wearily over his brow. 
I feel a little faint, he said, running upstairs so quickly, we never touched the beastly box, said robert. Then your confederates did said miss selina. No, no, said the curate hastily."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The reverend recteur passed his hand wearily over his brow, a hillwood of faintness and running upstairs so quickly we never touched the beastly box said the vicar then your competitor's did said missus nelly no no said the curate hastily.<|im_end|>", -0.06302247941493988, 0.056229472160339355, "The reverend septimus passed his hand wearily over his brow. I feel a little faint, he said, running upstairs so quickly, we never touched the beastly box, said robert. Then your confederates did said miss selina. No, no, said the curate hastily."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The reverend rectors passed his hand wearily over his brow, I feel a little faint now for running upstairs so quickly. We never touched the beastly box said morris then your competitor did said missus merrithew no, no said the curate hastily.<|im_end|>", 0.24413266777992249, 2.0956015586853027, "The reverend septimus passed his hand wearily over his brow. I feel a little faint, he said, running upstairs so quickly, we never touched the beastly box, said robert. Then your confederates did said miss selina. 
No, no, said the curate hastily."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The reverend recteur passed his hand wearily over his brow a hill with a fainting man running upstairs so quickly, we never touched the beastly box said Robert and your competitor did said missus minton no no said the curate hastily.<|im_end|>", -0.09589200466871262, -0.16200941801071167, "The reverend septimus passed his hand wearily over his brow. I feel a little faint, he said, running upstairs so quickly, we never touched the beastly box, said robert. Then your confederates did said miss selina. No, no, said the curate hastily."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The reverend recteur passed his hand wearily over his brow a hill with a faint memory of running upstairs so quickly, we never touched the beastly box said the curate and your confederates did said missus mallet no no said the curate hastily.<|im_end|>", -0.09384658932685852, -0.1484287828207016, "The reverend septimus passed his hand wearily over his brow. I feel a little faint, he said, running upstairs so quickly, we never touched the beastly box, said robert. Then your confederates did said miss selina. No, no, said the curate hastily."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The reverend rectors passed his hand wearily over his brow a hill of saint nicholas went upstairs so quickly, we never touched the beastly box said robert then your competitor did said missus mink no no said the curate hastily.<|im_end|>", -0.005024942569434643, 0.44130709767341614, "The reverend septimus passed his hand wearily over his brow. I feel a little faint, he said, running upstairs so quickly, we never touched the beastly box, said robert. Then your confederates did said miss selina. 
No, no, said the curate hastily."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The reverend rectory passed his hand wearily over his brow a hillwood saint may be running upstairs so briskly, we never touched the beastly box said the curate and your competitor did said missus nelly no no said the curate hastily.<|im_end|>", -0.13762426376342773, -0.43909287452697754, "The reverend septimus passed his hand wearily over his brow. I feel a little faint, he said, running upstairs so quickly, we never touched the beastly box, said robert. Then your confederates did said miss selina. No, no, said the curate hastily."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The reverend recteur passed his hand wearily over his brow, I feel a little faint now that I am upstairs so quickly. We never touched the beastly box either than your competitor did said missus nelly no, no said the curate hastily.<|im_end|>", -0.004176640883088112, 0.4469394385814667, "The reverend septimus passed his hand wearily over his brow. I feel a little faint, he said, running upstairs so quickly, we never touched the beastly box, said robert. Then your confederates did said miss selina. No, no, said the curate hastily."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The reverend recteur passed his hand wearily over his brow a hill with a faint memory of running upstairs so quickly we never touched the beastly box said robert then your competitor did said missus nunn no, no, said the curate hastily.<|im_end|>", 0.04079977795481682, 0.7455626726150513, "The reverend septimus passed his hand wearily over his brow. I feel a little faint, he said, running upstairs so quickly, we never touched the beastly box, said robert. Then your confederates did said miss selina. 
No, no, said the curate hastily."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The reverend recteur passed his hand wearily over his brow a hill of faintness and running upstairs so quickly, we never touched the beastly box said robert then your competitor did said missus innes no no said the curate hastily<|im_end|>", 0.001311193685978651, 0.483376145362854, "The reverend septimus passed his hand wearily over his brow. I feel a little faint, he said, running upstairs so quickly, we never touched the beastly box, said robert. Then your confederates did said miss selina. No, no, said the curate hastily."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>There was much amazement spread among her sister, that political aspects of the revolution in france changed almost every day she might not understand how his own views and sympathies might often modify them.<|im_end|>", -0.10891497135162354, -2.1773321628570557, "There was much armand saint just could not tell his sister the political aspect of the revolution in france was changing almost every day. She might not understand how his own views and sympathies might become modified."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>There was much armagogy for my cousin's sister, the political aspect of the revolution in france changing almost every day. She might not understand how his own views and sympathies might be modified.<|im_end|>", 0.3462296724319458, 1.5272533893585205, "There was much armand saint just could not tell his sister the political aspect of the revolution in france was changing almost every day. 
She might not understand how his own views and sympathies might become modified."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>There was much armagnac jokes with my cousin sister, the political aspect of the revolution in france changing almost every day she might not understand how his own views and sympathies might differ from mine.<|im_end|>", 0.11626709252595901, -0.34449443221092224, "There was much armand saint just could not tell his sister the political aspect of the revolution in france was changing almost every day. She might not understand how his own views and sympathies might become modified."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>There was much armagnac jokes with my cousin sister, the political aspect of the revolution in france changing almost every day. She might not understand how his own views and sympathies might often modify.<|im_end|>", 0.257978618144989, 0.808946430683136, "There was much armand saint just could not tell his sister the political aspect of the revolution in france was changing almost every day. She might not understand how his own views and sympathies might become modified."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>There was much amaranteuse about Parisian society, the political aspect of the revolution in France changing almost every day. She might not understand how his own views and sympathies might often modify her.<|im_end|>", 0.21243521571159363, 0.43825238943099976, "There was much armand saint just could not tell his sister the political aspect of the revolution in france was changing almost every day. 
She might not understand how his own views and sympathies might become modified."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>There was much armagnac, jute and martell in his drink. The political aspect of the revolution is hence changing almost every day. She might not understand how his own views and sympathies might often modify it.<|im_end|>", 0.10369522124528885, -0.4468214213848114, "There was much armand saint just could not tell his sister the political aspect of the revolution in france was changing almost every day. She might not understand how his own views and sympathies might become modified."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>There was much armaghajet for my cousin sister, the political aspect of the revolution in france changing almost every day she might not understand how his own views and sympathies might often modify them.<|im_end|>", 0.13262253999710083, -0.21137160062789917, "There was much armand saint just could not tell his sister the political aspect of the revolution in france was changing almost every day. She might not understand how his own views and sympathies might become modified."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>There was much amarante jute for my traveling sister, the political aspect of the revolution in france changing almost every day she might not understand how his own views and sympathies might be modified.<|im_end|>", 0.26360028982162476, 0.8547032475471497, "There was much armand saint just could not tell his sister the political aspect of the revolution in france was changing almost every day. 
She might not understand how his own views and sympathies might become modified."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>There was much armagnac yoked to my parent's estate, the political aspect of the revolution of france changing almost every day she might not understand how his own views and sympathies might be modified.<|im_end|>", 0.18032926321029663, 0.1769305318593979, "There was much armand saint just could not tell his sister the political aspect of the revolution in france was changing almost every day. She might not understand how his own views and sympathies might become modified."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>There was much armance and jocund merrymaking there, but the political aspect of the revolution is hence changing almost every day. She might not understand how his own views and sympathies might often modify hers.<|im_end|>", 0.033820733428001404, -1.0155549049377441, "There was much armand saint just could not tell his sister the political aspect of the revolution in france was changing almost every day. She might not understand how his own views and sympathies might become modified."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>There was much arme hautes in my town, sister. The political aspect of the revolution is hence changing almost every day. She might not understand how his own views and sympathies might often modify.<|im_end|>", 0.10335493087768555, -0.44959115982055664, "There was much armand saint just could not tell his sister the political aspect of the revolution in france was changing almost every day. 
She might not understand how his own views and sympathies might become modified."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>There was much amazement spread among her sister, the political aspect of the revolution in france changing almost every day. She might not understand how his own views and sympathies might often modify.<|im_end|>", 0.26168063282966614, 0.8390784859657288, "There was much armand saint just could not tell his sister the political aspect of the revolution in france was changing almost every day. She might not understand how his own views and sympathies might become modified."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Never prior to a public meeting that the order should be payable in any year and do bear interest of five per cent if these orders were disposed of provisionally at least would be purchased he seconded with very little hesitation adopted both orders were immediately printed<|im_end|>", -0.32611703872680664, -0.7204017639160156, "and therefore i propos'd that the orders should be payable in a year and to bear an interest of five per cent with these orders i suppos'd the provisions might easily be purchas'd the assembly with very little hesitation adopted the proposal the orders were immediately printed"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Never provided for both that the order should be payable in any and do bearing interest of five per cent if these orders were to suppose provisions might easily be purchased is now with very little hesitation adopted both orders were immediately printed.<|im_end|>", -0.15472601354122162, 0.3779638409614563, "and therefore i propos'd that the orders should be payable in a year and to bear an interest of five per cent with these orders i suppos'd the 
provisions might easily be purchas'd the assembly with very little hesitation adopted the proposal the orders were immediately printed"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Never prior to public opinion that the order should be payable in a year and do bear an interest of five per cent if these orders were disposed of provisionally at least would be purchased he said with very little hesitation adopting both orders were immediately printed.<|im_end|>", -0.28605878353118896, -0.4636869728565216, "and therefore i propos'd that the orders should be payable in a year and to bear an interest of five per cent with these orders i suppos'd the provisions might easily be purchas'd the assembly with very little hesitation adopted the proposal the orders were immediately printed"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Never prior, but once that they ordered it should be payable in England and do bear an interest of five per cent if these orders were disposed of provisionally at least would be purchased he said with very little hesitation adopted both orders were immediately printed.<|im_end|>", -0.4090765416622162, -1.252050757408142, "and therefore i propos'd that the orders should be payable in a year and to bear an interest of five per cent with these orders i suppos'd the provisions might easily be purchas'd the assembly with very little hesitation adopted the proposal the orders were immediately printed"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Never cried out boldly that the order should be payable in England and do bearing interest five per cent, if these orders were disposed of provisionally at least would be purchased. 
His nephew with very little hesitation adopted both orders were immediately printed.<|im_end|>", -0.5401909947395325, -2.0923023223876953, "and therefore i propos'd that the orders should be payable in a year and to bear an interest of five per cent with these orders i suppos'd the provisions might easily be purchas'd the assembly with very little hesitation adopted the proposal the orders were immediately printed"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Never, prior to published that they ordered it should be payable in a year and do bear an interest of five per cent if these orders were disposed of provisions might easily be purchased he snapped with very little hesitation adopted both orders were immediately printed.<|im_end|>", -0.031015297397971153, 1.1707684993743896, "and therefore i propos'd that the orders should be payable in a year and to bear an interest of five per cent with these orders i suppos'd the provisions might easily be purchas'd the assembly with very little hesitation adopted the proposal the orders were immediately printed"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Never prior to public debate that the order should be payable in any year and to bear an interest of five per cent, if these orders were supposed provisionists might easily be purchased. 
His cabinet with very little hesitation adopted both orders were immediately granted.<|im_end|>", -0.08785741031169891, 0.8064936995506287, "and therefore i propos'd that the orders should be payable in a year and to bear an interest of five per cent with these orders i suppos'd the provisions might easily be purchas'd the assembly with very little hesitation adopted the proposal the orders were immediately printed"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Never prior to public opinion that the order should be payable in England and do bear an interest of five per cent if these orders were supposed provisionally easy to be purchased, this act with very little hesitation adopted them both orders were immediately printed.<|im_end|>", -0.2863375246524811, -0.4654732942581177, "and therefore i propos'd that the orders should be payable in a year and to bear an interest of five per cent with these orders i suppos'd the provisions might easily be purchas'd the assembly with very little hesitation adopted the proposal the orders were immediately printed"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Never, privateer boat. 
That they ordered should be payable in England and do bear interest of five per cent that these orders might suppose the provisions might easily be purchased he seconded with very little hesitation adopted both orders were immediately printed.<|im_end|>", -0.09660232812166214, 0.7504515647888184, "and therefore i propos'd that the orders should be payable in a year and to bear an interest of five per cent with these orders i suppos'd the provisions might easily be purchas'd the assembly with very little hesitation adopted the proposal the orders were immediately printed"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Never, prior or above that they ordered should be payable in a year and to bear an interest of five per cent if these orders were disposed of provisionally at least would be purchased his nephew with very little hesitation adopted both orders were immediately granted<|im_end|>", -0.16866184771060944, 0.28865551948547363, "and therefore i propos'd that the orders should be payable in a year and to bear an interest of five per cent with these orders i suppos'd the provisions might easily be purchas'd the assembly with very little hesitation adopted the proposal the orders were immediately printed"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Never prior to published that the order should be payable in any and do bear an interest of five per cent, if these orders were supposed provisions might easily be purchased he seconded with very little hesitation adopted both orders were immediately printed.<|im_end|>", -0.08984959125518799, 0.7937267422676086, "and therefore i propos'd that the orders should be payable in a year and to bear an interest of five per cent with these orders i suppos'd the provisions might easily be purchas'd the assembly with very little hesitation adopted the proposal the orders 
were immediately printed"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Never, prior to public debate that the order should be payable in England and do bear an interest of five per cent. That these orders would suppose the provisions might easily be purchased. His cabinet with very little hesitation adopted both orders were immediately printed.<|im_end|>", -0.08795680850744247, 0.8058566451072693, "and therefore i propos'd that the orders should be payable in a year and to bear an interest of five per cent with these orders i suppos'd the provisions might easily be purchas'd the assembly with very little hesitation adopted the proposal the orders were immediately printed"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>As his trumpet blast sounded forth, he said, the free folk of all that hill give a cheap word and warning that they will fight against you when you come. To her own side came back this ringing reply as the knight rode up with many and fierce assailants.<|im_end|>", -0.7235177755355835, -0.37753382325172424, "Herald of arkell. As his trumpet blast sounded before the gate of the citadel, the free lord of arkell here giveth you word and warning that he will fight against you on the morrow. And from the citadel came back this ringing reply, as the knight of leyenburg made answer for his sovereign lady."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>As his trumpet blast sounded over the hill, the three lords of alba heard it and warned and warning at him to fight against you on your mountain. From whence he came back this ringing reply as a knightly lord might answer in such a manner.<|im_end|>", -0.7205132842063904, -0.3610304296016693, "Herald of arkell. 
As his trumpet blast sounded before the gate of the citadel, the free lord of arkell here giveth you word and warning that he will fight against you on the morrow. And from the citadel came back this ringing reply, as the knight of leyenburg made answer for his sovereign lady."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>As his trumpet blast sounded over the open field, the three lord larker here give it you word and warning that he will fight against you on your mountain from whence now came back this ringing reply of the knight in yellow with mallet and scimitar in hand.<|im_end|>", -0.4105190336704254, 1.3417396545410156, "Herald of arkell. As his trumpet blast sounded before the gate of the citadel, the free lord of arkell here giveth you word and warning that he will fight against you on the morrow. And from the citadel came back this ringing reply, as the knight of leyenburg made answer for his sovereign lady."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>As his trumpet blast sounded in the open air, the three four walked out and he gave a deep wordy warning that he would fight against you when you met him. And from the hill came back this ringing reply as the knight who had but lately entered the city wall.<|im_end|>", -0.6633491516113281, -0.04703306034207344, "Herald of arkell. As his trumpet blast sounded before the gate of the citadel, the free lord of arkell here giveth you word and warning that he will fight against you on the morrow. 
And from the citadel came back this ringing reply, as the knight of leyenburg made answer for his sovereign lady."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>As his trumpet blast sounded over the hills, the three lords of Argor hear give a deep word and warning that they will fight against you when you come. And from these lips came back this ringing reply as the knight who had brought my answer disappeared again.<|im_end|>", -0.533552348613739, 0.6659289002418518, "Herald of arkell. As his trumpet blast sounded before the gate of the citadel, the free lord of arkell here giveth you word and warning that he will fight against you on the morrow. And from the citadel came back this ringing reply, as the knight of leyenburg made answer for his sovereign lady."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>As his trumpet blast sounded forth, he said, the three lords of algalhia give a few word and warning that they will fight against you on your mountain when the messenger came back with screaming reply that the knight had been overtaken by the sons of the sea.<|im_end|>", -0.7495418190956116, -0.520481526851654, "Herald of arkell. As his trumpet blast sounded before the gate of the citadel, the free lord of arkell here giveth you word and warning that he will fight against you on the morrow. 
And from the citadel came back this ringing reply, as the knight of leyenburg made answer for his sovereign lady."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>As his trumpet blast sounded forth, he cried, the free folk of all great hill give us your word and warning that you will fight against you no more from whose lips came back this ringing reply as the knight who had brought my answer was singing aloud.<|im_end|>", -0.6600818634033203, -0.029086142778396606, "Herald of arkell. As his trumpet blast sounded before the gate of the citadel, the free lord of arkell here giveth you word and warning that he will fight against you on the morrow. And from the citadel came back this ringing reply, as the knight of leyenburg made answer for his sovereign lady."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>As his trumpet blast sounded through the air, he said, the three lords of all that hill give a chief warning warning that he will fight against you when the night is done with my engines and the sun goes down.<|im_end|>", -0.9883988499641418, -1.8325012922286987, "Herald of arkell. As his trumpet blast sounded before the gate of the citadel, the free lord of arkell here giveth you word and warning that he will fight against you on the morrow. And from the citadel came back this ringing reply, as the knight of leyenburg made answer for his sovereign lady."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>As his trumpet blast sounded over, he cried, the free born far from here give a cheap word and warning that he will fight against you when you know it, but from the hills came back this ringing reply of the knight who had heard my legend and was singing along.<|im_end|>", -0.6016453504562378, 0.29190027713775635, "Herald of arkell. 
As his trumpet blast sounded before the gate of the citadel, the free lord of arkell here giveth you word and warning that he will fight against you on the morrow. And from the citadel came back this ringing reply, as the knight of leyenburg made answer for his sovereign lady."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>As his trumpet blast sounded forth, he said the three lords of Argyle give a cheap word and warning that they will fight against you on the morrow. From his lips came back this ringing reply as the knight rode up with my lady and her sister in their arms.<|im_end|>", -0.5207002758979797, 0.7365241646766663, "Herald of arkell. As his trumpet blast sounded before the gate of the citadel, the free lord of arkell here giveth you word and warning that he will fight against you on the morrow. And from the citadel came back this ringing reply, as the knight of leyenburg made answer for his sovereign lady."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>As his trumpet blast sounded out, he exclaimed, the freeborn flock will hear gibbetty's warning and warn him of a fight against you on the morrow. The horned giant came back with a ringing reply as the knight rode up at my aunt's house in the evening.<|im_end|>", -0.906722903251648, -1.383862853050232, "Herald of arkell. As his trumpet blast sounded before the gate of the citadel, the free lord of arkell here giveth you word and warning that he will fight against you on the morrow. 
And from the citadel came back this ringing reply, as the knight of leyenburg made answer for his sovereign lady."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>As his trumpet blast sounded forth, he said, the free born robber here give a cheap word and warning that he will fight against you on the morrow. From the hill came back this ringing reply of the knight who had but lately entered into the city again.<|im_end|>", -0.3788970112800598, 1.5154365301132202, "Herald of arkell. As his trumpet blast sounded before the gate of the citadel, the free lord of arkell here giveth you word and warning that he will fight against you on the morrow. And from the citadel came back this ringing reply, as the knight of leyenburg made answer for his sovereign lady."]]}
wandb/run-20260417_123237-3h84yfea/files/media/table/completions_3_0656117578a4523e0161.table.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"columns": ["step", "prompt", "completion", "ASRWerSubLenCmpHalluDirtyV56", "advantages", "solution"], "data": [["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Coordinating and shifting, collectively said she who divided with each other in forming new combinations we must remember however that the flower worship of the teegos performed only a part of their ascetic ritual and it was not a distinct religion by itself.<|im_end|>", 0.14862142503261566, 0.6244527101516724, "kobori enshiu katagiri sekishiu vied with each other in forming new combinations we must remember however that the flower worship of the tea masters formed only a part of their aesthetic ritual and was not a distinct religion by itself"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Kohori and shi no kafu ni sei shi no vie with each other in forming new combinations. We must remember, however, that the flower worship of the te deus was formed from only a part of their respective ritual, and it was not a distinct religion by itself.<|im_end|>", -0.41201284527778625, -2.48225474357605, "kobori enshiu katagiri sekishiu vied with each other in forming new combinations we must remember however that the flower worship of the tea masters formed only a part of their aesthetic ritual and was not a distinct religion by itself"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Coordinating and shifting, coupling these symphysies, fighting with each other in forming new combinations. 
We must remember, however, that the flower worship of the timbuctoes formed only a part of their ascetic ritual, and was not a distinct religion by itself.<|im_end|>", 0.05453629419207573, 0.1030879095196724, "kobori enshiu katagiri sekishiu vied with each other in forming new combinations we must remember however that the flower worship of the tea masters formed only a part of their aesthetic ritual and was not a distinct religion by itself"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Kohori and mushi, kafanguri and seshishi, fight with each other in forming new combinations. We must remember however that the flower worship of the teengus was formed from only a part of their respective ritual and it was not a distinct religion by itself.<|im_end|>", 0.14244088530540466, 0.5902037620544434, "kobori enshiu katagiri sekishiu vied with each other in forming new combinations we must remember however that the flower worship of the tea masters formed only a part of their aesthetic ritual and was not a distinct religion by itself"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Coordinating and shifting, coupling these sub species by way with each other in forming new combinations. 
We must remember however that the flower worship of the tibetans was formed from only a part of their ascetic ritual, and it was not a distinct religion by itself.<|im_end|>", -0.07631387561559677, -0.6220072507858276, "kobori enshiu katagiri sekishiu vied with each other in forming new combinations we must remember however that the flower worship of the tea masters formed only a part of their aesthetic ritual and was not a distinct religion by itself"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Co-ordinating shi'lu, collectively said yishu, vied with each other in forming new combinations. We must remember, however, that the flower worship of the tin gods was but only a part of their respective ritual and it was not a distinct religion by itself.<|im_end|>", 0.05551755055785179, 0.10852545499801636, "kobori enshiu katagiri sekishiu vied with each other in forming new combinations we must remember however that the flower worship of the tea masters formed only a part of their aesthetic ritual and was not a distinct religion by itself"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Co-ordinating and shifting, collectively said she, fighting with each other in forming new combinations. 
We must remember, however, that the flower worship of the teentas was but only a part of their ascetic ritual, and it was not a distinct religion by itself.<|im_end|>", -0.08575789630413055, -0.6743404865264893, "kobori enshiu katagiri sekishiu vied with each other in forming new combinations we must remember however that the flower worship of the tea masters formed only a part of their aesthetic ritual and was not a distinct religion by itself"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Cobordia and shibu, kathagunis and yishu divided with each other in forming new combinations. We must remember however that the flower worship of the teengus was formed from only a part of their accepted ritual, and it was not a distinct religion by itself.<|im_end|>", 0.07381142675876617, 0.2098994255065918, "kobori enshiu katagiri sekishiu vied with each other in forming new combinations we must remember however that the flower worship of the tea masters formed only a part of their aesthetic ritual and was not a distinct religion by itself"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Coordinating and shifting, catalyzing and dissolving, vying with each other in forming new combinations. 
We must remember, however, that the flower worship of the tibetans was formed from only a part of their ascetic ritual, and it was not a distinct religion by itself.<|im_end|>", -0.07421640306711197, -0.6103842854499817, "kobori enshiu katagiri sekishiu vied with each other in forming new combinations we must remember however that the flower worship of the tea masters formed only a part of their aesthetic ritual and was not a distinct religion by itself"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Kohori and mushi, kafanuise and yishi combined with each other in forming new combinations. We must remember however that the flower worship of the teungus was formed from only a part of their respective ritual and it was not a distinct religion by itself.<|im_end|>", 0.14416144788265228, 0.5997381210327148, "kobori enshiu katagiri sekishiu vied with each other in forming new combinations we must remember however that the flower worship of the tea masters formed only a part of their aesthetic ritual and was not a distinct religion by itself"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Coordinating shiuk, collectively said, yishuk, fight with each other in forming new combinations. 
We must remember however that the flower worship of the tin gods was only a part of their accepted ritual and it was not a distinct religion by itself.<|im_end|>", 0.1842457801103592, 0.8218620419502258, "kobori enshiu katagiri sekishiu vied with each other in forming new combinations we must remember however that the flower worship of the tea masters formed only a part of their aesthetic ritual and was not a distinct religion by itself"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Kohori and mushi, katakuri and saki shu, fight with each other in forming new combinations. We must remember however that the flower worship of the tea masters formed only a part of their ascetic ritual, and was not a distinct religion by itself.<|im_end|>", 0.27616366744041443, 1.3312172889709473, "kobori enshiu katagiri sekishiu vied with each other in forming new combinations we must remember however that the flower worship of the tea masters formed only a part of their aesthetic ritual and was not a distinct religion by itself"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>With red hot boulders lying about everywhere, do you think it went off well? Creedle he asked, the victuals did that I know, and the drink did that I set fast to believe upon a sound of barrels good honest drink.<|im_end|>", 0.21575099229812622, 0.835888683795929, "with red hot bowlders lying about everywhere do you think it went off well creedle he asked the victuals did that i know and the drink did that i steadfastly believe from the holler sound of the barrels good honest drink"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>With red hot bolters flying about everywhere, d'you think it went off well? Creedle he asked her. 
The bittles did that I know and the drink did that I said passed in belief up on the chaffin barrels good honest strength.<|im_end|>", -0.07250922918319702, -1.3199952840805054, "with red hot bowlders lying about everywhere do you think it went off well creedle he asked the victuals did that i know and the drink did that i steadfastly believe from the holler sound of the barrels good honest drink"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>With red hot boulders flying about everywhere, d'you think it went off well at the cradle? He asked her the victuals did that I know and the drink did that I said passed me believe upon a sound of barrels good honest strength.<|im_end|>", -0.02524890936911106, -0.9665377140045166, "with red hot bowlders lying about everywhere do you think it went off well creedle he asked the victuals did that i know and the drink did that i steadfastly believe from the holler sound of the barrels good honest drink"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>With red hot boulders lying about everywhere, do you think it went off well? Creedle he asked the victors did that I know and the drink did that I set fast to believe upon a sound of barrels good honest strength.<|im_end|>", 0.2779328227043152, 1.3009434938430786, "with red hot bowlders lying about everywhere do you think it went off well creedle he asked the victuals did that i know and the drink did that i steadfastly believe from the holler sound of the barrels good honest drink"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>With red hot boulders lying about everywhere. D'you think it went off while a cradle? 
He asked her, the victuals did that I know and the drink did that I steadfastly believe upon a sound of barrels good honest drink.<|im_end|>", 0.23886768519878387, 1.0087772607803345, "with red hot bowlders lying about everywhere do you think it went off well creedle he asked the victuals did that i know and the drink did that i steadfastly believe from the holler sound of the barrels good honest drink"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>With red hot boulders lying about everywhere, d'you think it went off while cradle? He asked her, the victuals did that I know and the drink did, that I said fastly believe upon a chance of barrels good honest drink.<|im_end|>", 0.015103586949408054, -0.6647433638572693, "with red hot bowlders lying about everywhere do you think it went off well creedle he asked the victuals did that i know and the drink did that i steadfastly believe from the holler sound of the barrels good honest drink"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>With red hot boulders lying about everywhere, d'you think it went off well? Creel he asked her the victuals did that I know and the drink did that I said passed me believe up on a chaff in barrels good honest strength.<|im_end|>", -0.05440647527575493, -1.1846057176589966, "with red hot bowlders lying about everywhere do you think it went off well creedle he asked the victuals did that i know and the drink did that i steadfastly believe from the holler sound of the barrels good honest drink"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>With red hot boulders lying about everywhere. Did you think it went off well, creedle? He asked me. 
The victuals did that I know and the drink did, that I said, must be believe upon a sound of barrels good honest strength.<|im_end|>", 0.08476551622152328, -0.14374522864818573, "with red hot bowlders lying about everywhere do you think it went off well creedle he asked the victuals did that i know and the drink did that i steadfastly believe from the holler sound of the barrels good honest drink"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>With red hot boulders flying about everywhere. D'you think it went off well, creel? He asked her. The victuals did that I know and the drink did that I steadfastly believe upon a sound of barrels good honest strength.<|im_end|>", 0.2250947505235672, 0.9057701826095581, "with red hot bowlders lying about everywhere do you think it went off well creedle he asked the victuals did that i know and the drink did that i steadfastly believe from the holler sound of the barrels good honest drink"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>With red hot bolters flying about everywhere, do you think it went off well? Creel he asked. The biddles did that I know and the drink did that I steadfastly believe upon a sound of barrels good honest drink.<|im_end|>", 0.27579447627067566, 1.2849509716033936, "with red hot bowlders lying about everywhere do you think it went off well creedle he asked the victuals did that i know and the drink did that i steadfastly believe from the holler sound of the barrels good honest drink"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>With red hot boulders lying about everywhere, do you think it went off while in the cradle? He asked her. 
The victuals did that I know, and the drink did that I said passed me believe upon a sound of barrels good honest drink.<|im_end|>", 0.03807579353451729, -0.4929353892803192, "with red hot bowlders lying about everywhere do you think it went off well creedle he asked the victuals did that i know and the drink did that i steadfastly believe from the holler sound of the barrels good honest drink"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>With red hot boulders flying about everywhere. D'you think it went off well, creedle? He asked her. The victuals did that I know and the drink did that I set fast in believe upon a sound of barrels good honest drink.<|im_end|>", 0.028604861348867416, -0.5637679696083069, "with red hot bowlders lying about everywhere do you think it went off well creedle he asked the victuals did that i know and the drink did that i steadfastly believe from the holler sound of the barrels good honest drink"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For it is wonderful how names can be acquired by some means. The writer was once employed in teaching a course of lectures to his friends, and repeated very handsome gilding on the colonies of babies which seemed to answer just at once.<|im_end|>", -0.5981812477111816, -0.7124949097633362, "For it is wonderful how soon these are acquired by some horses. The writer was once employed to purchase a horse for a country friend. And he picked a very handsome gelding out of collins's stables, which seemed to answer to his friend's wants."], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For it is wonderful how many things may be acquired by some means. 
The writer was once employed in teaching a boy his arithmetic to French, and repeated very handsome gilding on the colonies of babies, which seems answer to the parents wants.<|im_end|>", -0.6030839681625366, -0.7439505457878113, "For it is wonderful how soon these are acquired by some horses. The writer was once employed to purchase a horse for a country friend. And he picked a very handsome gelding out of collins's stables, which seemed to answer to his friend's wants."], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For it is wonderful how a name can be acquired by some means. The writer was once employed in purchasing a horse for his brother's friend, and he picked up mary hansen gelding on the collins estate, which seems answer to his friend's wants.<|im_end|>", -0.16422338783740997, 2.071758270263672, "For it is wonderful how soon these are acquired by some horses. The writer was once employed to purchase a horse for a country friend. And he picked a very handsome gelding out of collins's stables, which seemed to answer to his friend's wants."], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For it is wonderful how many names have been supplied by some of us. The writer was once employed in teaching a course of lectures on French, and repeated Mary hansen gellin on the colonies of ladies, which seems answerable to his friend's wants.<|im_end|>", -0.6562139391899109, -1.0848299264907837, "For it is wonderful how soon these are acquired by some horses. The writer was once employed to purchase a horse for a country friend. 
And he picked a very handsome gelding out of collins's stables, which seemed to answer to his friend's wants."], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For it is wonderful how many things can be acquired by some means a writer was once employed in preaching authority from scripture to friends, and he picked up mary hansen gelding on the colony of cape town, which seems answer to his friend's wants.<|im_end|>", -0.48777177929878235, -0.00411293376237154, "For it is wonderful how soon these are acquired by some horses. The writer was once employed to purchase a horse for a country friend. And he picked a very handsome gelding out of collins's stables, which seemed to answer to his friend's wants."], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For it is wonderful how names may be acquired by some means a writer was once employed in purchase of horses from a friend and repeated mary hansen gilding on the colony of scotland which seems answer to his friend's want.<|im_end|>", -0.45017996430397034, 0.23707440495491028, "For it is wonderful how soon these are acquired by some horses. The writer was once employed to purchase a horse for a country friend. And he picked a very handsome gelding out of collins's stables, which seemed to answer to his friend's wants."], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For it is wonderful how men can be inspired by some of these things. The writer was once employed in purchase of horses from his friends, and they picked up very handsome geldings on the colonies of cape verd which seemed to answer just such wants.<|im_end|>", -0.5413256883621216, -0.34771230816841125, "For it is wonderful how soon these are acquired by some horses. 
The writer was once employed to purchase a horse for a country friend. And he picked a very handsome gelding out of collins's stables, which seemed to answer to his friend's wants."], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For it is wonderful how names may be acquired by some means a writer was once employed in purchase of one such book from his friend and repeated mary hansen gelling on the colonies of ceders which seems answer to his friend's wants.<|im_end|>", -0.5219820141792297, -0.2236042022705078, "For it is wonderful how soon these are acquired by some horses. The writer was once employed to purchase a horse for a country friend. And he picked a very handsome gelding out of collins's stables, which seemed to answer to his friend's wants."], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For it is wonderful how a name can be acquired by some means. The writer was once employed in teaching a course of lectures on French, and repeated Mary henson gilding on the colonies of Canada, which seems answer to his friend's wants.<|im_end|>", -0.4530133306980133, 0.21889565885066986, "For it is wonderful how soon these are acquired by some horses. The writer was once employed to purchase a horse for a country friend. And he picked a very handsome gelding out of collins's stables, which seemed to answer to his friend's wants."], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For it is wonderful how many things are required by some of us. The writer was once employed in preaching before a large company at friends, and repeated with very handsome gilding on the columns of statius which seems answer to his friend's wants.<|im_end|>", -0.5449039340019226, -0.3706701695919037, "For it is wonderful how soon these are acquired by some horses. 
The writer was once employed to purchase a horse for a country friend. And he picked a very handsome gelding out of collins's stables, which seemed to answer to his friend's wants."], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For it is wonderful how many things can be acquired by some means a writer was once employed in purchase of horses from his friends and he picked up very handsome geldings on the colonies of cape cruz which seemed to answer to his friend's wants.<|im_end|>", -0.20373354852199554, 1.8182631731033325, "For it is wonderful how soon these are acquired by some horses. The writer was once employed to purchase a horse for a country friend. And he picked a very handsome gelding out of collins's stables, which seemed to answer to his friend's wants."], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For it is wonderful how men may be inspired by some muse a writer was once employed in which office he got continual friends and made pictures very handsome gilding on the columns of statues which seems answer to his friend's wants.<|im_end|>", -0.6209558844566345, -0.8586159348487854, "For it is wonderful how soon these are acquired by some horses. The writer was once employed to purchase a horse for a country friend. And he picked a very handsome gelding out of collins's stables, which seemed to answer to his friend's wants."], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>A week after the battle, my brother replied there on a capital expedition to make a horrible discovery that involved eating up the bodies of our dead heroes. 
That too was worth it.<|im_end|>", 0.11993206292390823, 0.7482782602310181, "a week after the battle my brother rode by there on a cavalry expedition and made the horrible discovery that hogs were eating up the bodies of our dead heroes that too was war"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>A week after the battle, my brother was invited by a cavalry expedition to make a horrible supper at a hall in the eating of the bodies of our dead heroes. That too is over.<|im_end|>", -0.41032978892326355, -1.1197341680526733, "a week after the battle my brother rode by there on a cavalry expedition and made the horrible discovery that hogs were eating up the bodies of our dead heroes that too was war"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>A week after the battle, my brother took a lighter and captured my expedition to make the horrible discovery that all were eating up the bodies of our dead heroes. That too was worth it.<|im_end|>", 0.021145427599549294, 0.40027153491973877, "a week after the battle my brother rode by there on a cavalry expedition and made the horrible discovery that hogs were eating up the bodies of our dead heroes that too was war"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>A week after the battle, my brother stood by her on the scaffold in my position and made a horrible discovery that I had caught the beating of the pines of our dead heroes. 
That too was worth it.<|im_end|>", -0.47986671328544617, -1.3646996021270752, "a week after the battle my brother rode by there on a cavalry expedition and made the horrible discovery that hogs were eating up the bodies of our dead heroes that too was war"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>A week after the battle, my brother was invited by a capital man of business to make a horrible discovery at home, eating up the bodies of our dead heroes. That too was worth it.<|im_end|>", -0.32124173641204834, -0.8058937788009644, "a week after the battle my brother rode by there on a cavalry expedition and made the horrible discovery that hogs were eating up the bodies of our dead heroes that too was war"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>A week after the battle, my brother replied there in a cavalry expedition to make a horrible discovery at home of the bodies of our dead heroes. That too was worth it.<|im_end|>", -0.12081809341907501, -0.09983913600444794, "a week after the battle my brother rode by there on a cavalry expedition and made the horrible discovery that hogs were eating up the bodies of our dead heroes that too was war"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>A week after the battle, my brother replied there in a capital translation to me the horrible discovery that all were eating up the bodies of our dead heroes. 
That too was worth it.<|im_end|>", 0.1116841584444046, 0.7192224264144897, "a week after the battle my brother rode by there on a cavalry expedition and made the horrible discovery that hogs were eating up the bodies of our dead heroes that too was war"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>A week after the battle, my brother was invited by our cavalry expedition to make a horrible supper at a hall meeting of the bodies of our dead heroes. That too was ordered.<|im_end|>", -0.3647739291191101, -0.9592495560646057, "a week after the battle my brother rode by there on a cavalry expedition and made the horrible discovery that hogs were eating up the bodies of our dead heroes that too was war"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>A week after the battle, my brother replied there from the capital of my expedition, he made a horrible discovery that called for eating up the bodies of our dead heroes. That too was ordered.<|im_end|>", -0.16730603575706482, -0.263607382774353, "a week after the battle my brother rode by there on a cavalry expedition and made the horrible discovery that hogs were eating up the bodies of our dead heroes that too was war"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>A week after the battle, my brother replied there from a cavalry expedition and made a horrible discovery that called the eating of the bodies of our dead heroes. 
That too was war.<|im_end|>", 0.26659682393074036, 1.2649505138397217, "a week after the battle my brother rode by there on a cavalry expedition and made the horrible discovery that hogs were eating up the bodies of our dead heroes that too was war"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>A week after the battle, my brother replied there on a capital expedition to make the horrible discovery that he had fallen in the eating of the pies of our dead heroes. That too was a word.<|im_end|>", -0.18637478351593018, -0.3307829797267914, "a week after the battle my brother rode by there on a cavalry expedition and made the horrible discovery that hogs were eating up the bodies of our dead heroes that too was war"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>A week after the battle, my brother rode by there on a cavalry expedition to make the horrible discovery that Paul was eating up the bodies of our dead heroes. That too is worth.<|im_end|>", 0.4216246008872986, 1.8110840320587158, "a week after the battle my brother rode by there on a cavalry expedition and made the horrible discovery that hogs were eating up the bodies of our dead heroes that too was war"]]}
wandb/run-20260417_123237-3h84yfea/files/media/table/completions_5_f2bf6a8e887194296a09.table.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"columns": ["step", "prompt", "completion", "ASRWerSubLenCmpHalluDirtyV56", "advantages", "solution"], "data": [["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Instead of listening to you, I tell you that from this day forward, I will give that great man a pension of a thousand pieces of gold per month for his life. Nay, though I were to share with him all my riches and dominions.<|im_end|>", 0.7513310313224792, -0.40651965141296387, "instead of listening to you i tell you that from this day forward i will give that great man a pension of a thousand pieces of gold per month for his life nay though i were to share with him all my riches and dominions"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Instead of listening to you, I tell you that from this day forward, I will give that great man a pension of a thousand pieces of gold per month for his life. Nay, though I were to share with him all my riches and provisions.<|im_end|>", 0.7468931674957275, -0.49668067693710327, "instead of listening to you i tell you that from this day forward i will give that great man a pension of a thousand pieces of gold per month for his life nay though i were to share with him all my riches and dominions"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Instead of listening to you, I tell you that from this day forward, I will give that great man a pension of a thousand pieces of gold per month for his life. 
Nay, though I were to share with him all my riches and dominions.<|im_end|>", 0.7513310313224792, -0.40651965141296387, "instead of listening to you i tell you that from this day forward i will give that great man a pension of a thousand pieces of gold per month for his life nay though i were to share with him all my riches and dominions"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Instead of listening to you, I tell you that from this day forward, I will give that great man a pension of a thousand pieces of gold per month for his life. Nay, though I were to share with him all my riches and dominions.<|im_end|>", 0.7513310313224792, -0.40651965141296387, "instead of listening to you i tell you that from this day forward i will give that great man a pension of a thousand pieces of gold per month for his life nay though i were to share with him all my riches and dominions"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Instead of listening to you, I tell you that from this day forward, I will give that great man a pension of a thousand pieces of gold per month for his life. Nay, though I were to share with him all my riches and dominions.<|im_end|>", 0.7513310313224792, -0.40651965141296387, "instead of listening to you i tell you that from this day forward i will give that great man a pension of a thousand pieces of gold per month for his life nay though i were to share with him all my riches and dominions"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Instead of listening to you, I tell you that from this day forward, I will give that great man a pension of a thousand pieces of gold per month for his life. 
Nay, though I were to share with him all my riches and dominions.<|im_end|>", 0.7513310313224792, -0.40651965141296387, "instead of listening to you i tell you that from this day forward i will give that great man a pension of a thousand pieces of gold per month for his life nay though i were to share with him all my riches and dominions"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Instead of listening to you, I tell you that from this day forward, I will give that great man a pension of a thousand pieces of gold per month for his life. Nay, though I were to share with him all my riches and dominions.<|im_end|>", 0.7513310313224792, -0.40651965141296387, "instead of listening to you i tell you that from this day forward i will give that great man a pension of a thousand pieces of gold per month for his life nay though i were to share with him all my riches and dominions"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Instead of listening to you, I tell you that from this day forward, I will give that great man a pension of a thousand pieces of gold per month for his life. 
Nay, though I were to share with him all my riches and dominions.<|im_end|>", 0.7513310313224792, -0.40651965141296387, "instead of listening to you i tell you that from this day forward i will give that great man a pension of a thousand pieces of gold per month for his life nay though i were to share with him all my riches and dominions"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Instead of listening to you, I tell you that from this day forward I will give that great man a pension of a thousand pieces of gold per month for his life nay, though I were to share with him all my riches and provisions<|im_end|>", 0.8469211459159851, 1.5355191230773926, "instead of listening to you i tell you that from this day forward i will give that great man a pension of a thousand pieces of gold per month for his life nay though i were to share with him all my riches and dominions"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Instead of listening to you, I tell you that from this day forward, I will give that great man a pension of a thousand pieces of gold per month for his life nay though I were to share with him all my riches and dominions<|im_end|>", 0.9002925753593445, 2.6198298931121826, "instead of listening to you i tell you that from this day forward i will give that great man a pension of a thousand pieces of gold per month for his life nay though i were to share with him all my riches and dominions"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Instead of listening to you, I tell you that from this day forward, I will give that great man a pension of a thousand pieces of gold per month for his life. 
Nay, though I were to share with him all my riches and dominions.<|im_end|>", 0.7513310313224792, -0.40651965141296387, "instead of listening to you i tell you that from this day forward i will give that great man a pension of a thousand pieces of gold per month for his life nay though i were to share with him all my riches and dominions"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Instead of listening to you, I tell you that from this day forward, I will give that great man a pension of a thousand pieces of gold per month for his life. Nay, though I were to share with him all my riches and dominions.<|im_end|>", 0.7513310313224792, -0.40651965141296387, "instead of listening to you i tell you that from this day forward i will give that great man a pension of a thousand pieces of gold per month for his life nay though i were to share with him all my riches and dominions"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The baker shook his head, the crime which I have committed now or has no place among you in justice. And you can only deliver me from it by blessing me secretly as you have just done come, put hand before the persecutor.<|im_end|>", -0.023505905643105507, -0.4367395341396332, "The beggar shook his head. The crime which I have committed, my lord, has no call upon human justice. And you can only deliver me from it by blessing me frequently, as you have just done. Come be candid, said the coadjutor."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The baker shook his head, the crime which I have committed now will have no cause of human injustice. And you can only deliver me from it by blessing this wicked day as you have just done. 
Come, my candids said the presider.<|im_end|>", -0.021910538896918297, -0.4288407862186432, "The beggar shook his head. The crime which I have committed, my lord, has no call upon human justice. And you can only deliver me from it by blessing me frequently, as you have just done. Come be candid, said the coadjutor."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The baker shook his head, the crime which I have committed now will be called upon you in justice and you can only deliver me from it by blessing this sacred day as you have just done come let's end it said the presider.<|im_end|>", -0.23740261793136597, -1.495755672454834, "The beggar shook his head. The crime which I have committed, my lord, has no call upon human justice. And you can only deliver me from it by blessing me frequently, as you have just done. Come be candid, said the coadjutor."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The baker shook his head, but the crime which I have committed now is too large for any injustice and you can only deliver me from it by blessing me secretly as you have just done. Come up hand before the persecutor.<|im_end|>", -0.08132755011320114, -0.7230181097984314, "The beggar shook his head. The crime which I have committed, my lord, has no call upon human justice. And you can only deliver me from it by blessing me frequently, as you have just done. Come be candid, said the coadjutor."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The baker shook his head, the crime which I have committed now or has just passed on me of justice and you can only deliver me from it by blessing me frequently as you have just done come with candor said the presider.<|im_end|>", -0.018306119367480278, -0.4109950661659241, "The beggar shook his head. 
The crime which I have committed, my lord, has no call upon human justice. And you can only deliver me from it by blessing me frequently, as you have just done. Come be candid, said the coadjutor."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The baker shook his head, the crime which I have committed now won't hold you call upon human justice, and you can only deliver me from it by blessing this secret way as you have just done. Come with candor said the persecutor.<|im_end|>", 0.11918030679225922, 0.26970887184143066, "The beggar shook his head. The crime which I have committed, my lord, has no call upon human justice. And you can only deliver me from it by blessing me frequently, as you have just done. Come be candid, said the coadjutor."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The baker shook his head. The crime which I have committed, my lord has no cause of human justice, and you can only deliver me from it by blessing me frequently as you have just done come with candor said the presider.<|im_end|>", 0.3861045837402344, 1.591267704963684, "The beggar shook his head. The crime which I have committed, my lord, has no call upon human justice. And you can only deliver me from it by blessing me frequently, as you have just done. Come be candid, said the coadjutor."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The beggar shook his head, the crime which I have committed now or has been called upon me by justice, and you can only deliver me from it by blessing me secretly as you have just done come with candor said the porter to juno.<|im_end|>", 0.011092587374150753, -0.2654402256011963, "The beggar shook his head. The crime which I have committed, my lord, has no call upon human justice. 
And you can only deliver me from it by blessing me frequently, as you have just done. Come be candid, said the coadjutor."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The beggar shook his head, the crime which I have committed now would have no place among you in justice, and you can only deliver me from it by blessing me frequently as you have just done come with candids said the porter turtle.<|im_end|>", -0.0024881232529878616, -0.3326791822910309, "The beggar shook his head. The crime which I have committed, my lord, has no call upon human justice. And you can only deliver me from it by blessing me frequently, as you have just done. Come be candid, said the coadjutor."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The beggar shook his head, the crime which I have committed, my lord has no palliation in justice, and you can only deliver me from it by blessing me frequently as you have just done. Come with candor said the procurator.<|im_end|>", 0.3988274335861206, 1.6542593240737915, "The beggar shook his head. The crime which I have committed, my lord, has no call upon human justice. And you can only deliver me from it by blessing me frequently, as you have just done. Come be candid, said the coadjutor."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The beggar shook his head, the crime which I have committed, my lord, has no place among you in justice, and you can only deliver me from it by blessing me secretly as you have just done come with candids said the presbyter.<|im_end|>", 0.32486215233802795, 1.2880525588989258, "The beggar shook his head. The crime which I have committed, my lord, has no call upon human justice. And you can only deliver me from it by blessing me frequently, as you have just done. 
Come be candid, said the coadjutor."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The beggar shook his head, decline which I have permitted my lord has no cause for any injustice and you can only deliver me from it by blessing us equally as you have just done come but hand it to the procurator.<|im_end|>", -0.07866184413433075, -0.709820032119751, "The beggar shook his head. The crime which I have committed, my lord, has no call upon human justice. And you can only deliver me from it by blessing me frequently, as you have just done. Come be candid, said the coadjutor."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>What was Hamphill's great and enduring jubilation with the emotions that stirred within him when he first bushwhacked his seeming grey matter? It was stirred the remembrance that Pontiac had warned them that women were robbing the house you mean a woman.<|im_end|>", -0.49033617973327637, 0.36183518171310425, "the buttons on phelan's coat were fairly undulating with the emotions that stirred within him in his seething gray matter there stirred the remembrance that bateato had told him that women were robbing the house you mean the women"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>What was Hamphair's great concern, accumulating with the emotions that stirred within him when he first bushwhacked his seemingly gray matter? 
There stirred the remembrance that but a few moments ago, that women were robbing the house you mean the women.<|im_end|>", -0.30832746624946594, 0.963458776473999, "the buttons on phelan's coat were fairly undulating with the emotions that stirred within him in his seething gray matter there stirred the remembrance that bateato had told him that women were robbing the house you mean the women"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>So she did button some papers away and started accumulating with the emotions that stirred within one night for a first bushwacker in his seeming gray matter there stirred the remembrance that monte agello had told them women were robbing the house you mean the sheriff<|im_end|>", -0.4897034466266632, 0.3639266788959503, "the buttons on phelan's coat were fairly undulating with the emotions that stirred within him in his seething gray matter there stirred the remembrance that bateato had told him that women were robbing the house you mean the women"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The buttons of phaeton's coat were accumulating with the emotions that stirred within one at first bushwick in his seeming gray matter there stirred the remembrance that monteagle had told them women were riding the house you mean a woman<|im_end|>", 0.051824573427438736, 2.1539289951324463, "the buttons on phelan's coat were fairly undulating with the emotions that stirred within him in his seething gray matter there stirred the remembrance that bateato had told him that women were robbing the house you mean the women"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>But in some paler, gray and dreary, accumulating with the emotions that stirred within one like hers bushwick's eyes did seem in grey matter 
there stirred the remembrance that batty apples had been at Quinn's for riding the house you mean the sheriff?<|im_end|>", -0.8388098478317261, -0.7900326251983643, "the buttons on phelan's coat were fairly undulating with the emotions that stirred within him in his seething gray matter there stirred the remembrance that bateato had told him that women were robbing the house you mean the women"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>She caught some faint expression of fear, mingling with the emotions that stirred within her when she first beheld this hideous beast. His seeming gray matter evoked the remembrance that battyappo had told them women were rotting in the house you mean a woman?<|im_end|>", -0.7576847672462463, -0.5218764543533325, "the buttons on phelan's coat were fairly undulating with the emotions that stirred within him in his seething gray matter there stirred the remembrance that bateato had told him that women were robbing the house you mean the women"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>But some feelings which were accumulating with the emotions that stirred within one's heart for a perverse bushman did seem in gray matter to stir the remembrance that botany had reported that women were riding the house you mean, of women.<|im_end|>", -0.6848458051681519, -0.2811097204685211, "the buttons on phelan's coat were fairly undulating with the emotions that stirred within him in his seething gray matter there stirred the remembrance that bateato had told him that women were robbing the house you mean the women"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>What had some feelings greatly intermingling with the emotions that stirred within one at first bushwick and his seemingly gray matter there stirred 
the remembrance that but a few weeks ago, when women were rioting in the house you mean the sheriff<|im_end|>", -0.537434458732605, 0.20615343749523163, "the buttons on phelan's coat were fairly undulating with the emotions that stirred within him in his seething gray matter there stirred the remembrance that bateato had told him that women were robbing the house you mean the women"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>So she did buttons of phaeton's face was very stimulating with the emotions that stirred within one like her own it seemed in gray matter there stirred the remembrance that but a half hour ago, that women were riding the house you mean the women.<|im_end|>", -0.5774927735328674, 0.07374204695224762, "the buttons on phelan's coat were fairly undulating with the emotions that stirred within him in his seething gray matter there stirred the remembrance that bateato had told him that women were robbing the house you mean the women"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>She thought some palates of bacon, and very stimulating with the emotions that stirred within one heart for the first bushwacker in his seeming gray matter there stirred the remembrance that but a little before that women were riding the house you mean a woman.<|im_end|>", -0.5789588689804077, 0.06889592111110687, "the buttons on phelan's coat were fairly undulating with the emotions that stirred within him in his seething gray matter there stirred the remembrance that bateato had told him that women were robbing the house you mean the women"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>To shiver buttons had failed to wake him and he was still accumulating with the emotions that stirred within him when they first met in his seemingly grey 
matter there stirred the remembrance that but a few weeks before women were riding the house you mean the ship?<|im_end|>", -0.8068899512290955, -0.6845225095748901, "the buttons on phelan's coat were fairly undulating with the emotions that stirred within him in his seething gray matter there stirred the remembrance that bateato had told him that women were robbing the house you mean the women"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>So she heard buttons, having failed to wake him, began accumulating with the emotions that stirred within her when he first pushed me aside in his seemingly grave manner and restored the remembrance that battyata was one of them who were riding the house you mean a servant.<|im_end|>", -1.1789628267288208, -1.9143966436386108, "the buttons on phelan's coat were fairly undulating with the emotions that stirred within him in his seething gray matter there stirred the remembrance that bateato had told him that women were robbing the house you mean the women"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They set up the side show early in the morning before the first guest arrived at park.<|im_end|>", 0.5806475877761841, -0.7072128057479858, "They set up the sideshow early in the morning before the first guests arrived at park."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They set up the side show early in the morning before the first guests arrived at park.<|im_end|>", 0.7450000047683716, 0.4686703085899353, "They set up the sideshow early in the morning before the first guests arrived at park."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They set up the side show early in the morning before the first guests arrived 
at park.<|im_end|>", 0.7450000047683716, 0.4686703085899353, "They set up the sideshow early in the morning before the first guests arrived at park."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They set up the side show early in the morning before the first guest arrived at park.<|im_end|>", 0.5806475877761841, -0.7072128057479858, "They set up the sideshow early in the morning before the first guests arrived at park."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They set up the side show early in the morning before the first guest arrived at park.<|im_end|>", 0.5806475877761841, -0.7072128057479858, "They set up the sideshow early in the morning before the first guests arrived at park."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They set up the side show early in the morning before the first guest arrived at park.<|im_end|>", 0.5806475877761841, -0.7072128057479858, "They set up the sideshow early in the morning before the first guests arrived at park."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They set up the side show early in the morning before the first guest arrived at park.<|im_end|>", 0.5806475877761841, -0.7072128057479858, "They set up the sideshow early in the morning before the first guests arrived at park."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They set up the side show early in the morning before the first guests arrived at park.<|im_end|>", 0.7450000047683716, 0.4686703085899353, "They set up the sideshow early in the morning before the first guests arrived at park."], ["10", 
"<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They set up the sideshow early in the morning before the first guest arrived at park.<|im_end|>", 0.8543975949287415, 1.251371145248413, "They set up the sideshow early in the morning before the first guests arrived at park."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They set up the side show early in the morning before the first guest arrived at park.<|im_end|>", 0.5806475877761841, -0.7072128057479858, "They set up the sideshow early in the morning before the first guests arrived at park."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They set up the sideshow early in the morning before the first guests arrived at park.<|im_end|>", 1.0, 2.293104648590088, "They set up the sideshow early in the morning before the first guests arrived at park."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They set up the side show early in the morning before the first guest arrived at park.<|im_end|>", 0.5806475877761841, -0.7072128057479858, "They set up the sideshow early in the morning before the first guests arrived at park."]]}
wandb/run-20260417_123237-3h84yfea/files/media/table/completions_7_4930391b310cfe338705.table.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"columns": ["step", "prompt", "completion", "ASRWerSubLenCmpHalluDirtyV56", "advantages", "solution"], "data": [["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>darted furious glances at one another what they meant certainly which looked well for us all got out a long box and sawn it in severe weather well every ship drew upon side five on the other with a pit between us<|im_end|>", -0.711168646812439, -1.6506024599075317, "darting furious glances behind them one thing i observed which looked well for us they all got out upon the opposite side from silver well there we stood two on one side five on the other the pit between us"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Darling, furious glances were coming from her one thing I am certain which looked well for us all got out along tops and sides of this hill well there we stood two on one side five on the other with a pit between us<|im_end|>", -0.056266773492097855, 0.6078363656997681, "darting furious glances behind them one thing i observed which looked well for us they all got out upon the opposite side from silver well there we stood two on one side five on the other the pit between us"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>darted furious glances in our direction. One thing I am certain, which looked well for us, we all got out upon puffs and sighs of superiority. 
Well, every stroke two on one side five on the other was a pity to me as.<|im_end|>", -0.5369827151298523, -1.0499197244644165, "darting furious glances behind them one thing i observed which looked well for us they all got out upon the opposite side from silver well there we stood two on one side five on the other the pit between us"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>darted furious glances about one thing I am certain which looked well for us all got out of our cloaks and stockings well every ship drew upon side five on the other to pick each others<|im_end|>", -0.4635177254676819, -0.796574592590332, "darting furious glances behind them one thing i observed which looked well for us they all got out upon the opposite side from silver well there we stood two on one side five on the other the pit between us"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>darting furious glances at one another, one thing i am certain which looked well for us we all got out on the opposite side and disappeared. 
Well, there we stood two upon one side five on the other in a pit between us.<|im_end|>", 0.12982679903507233, 1.2495828866958618, "darting furious glances behind them one thing i observed which looked well for us they all got out upon the opposite side from silver well there we stood two on one side five on the other the pit between us"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>darted furious glances about one thing I am certain which looked well for us we all got out upon blocks and sides of the sewer well there we stood two on one side five on the other with a pit between us<|im_end|>", 0.13510093092918396, 1.267770767211914, "darting furious glances behind them one thing i observed which looked well for us they all got out upon the opposite side from silver well there we stood two on one side five on the other the pit between us"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Darling furious and lenses were out of order one thing I am certain which looked well for us we all got out upon tops and sides in the severe weather well there we stood two on one side five on the other the pit between us<|im_end|>", -0.07753195613622665, 0.5345030426979065, "darting furious glances behind them one thing i observed which looked well for us they all got out upon the opposite side from silver well there we stood two on one side five on the other the pit between us"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>darted furious glances about one thing I am certain which looked well for us all got out of our cloths and stockings and stood up well every ship two on one side five on the other with a pit between us<|im_end|>", -0.21955648064613342, 0.04472939670085907, "darting furious glances behind them one thing i observed which looked well 
for us they all got out upon the opposite side from silver well there we stood two on one side five on the other the pit between us"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Darling, furious and wenceslas had been there. One thing I am certain which looked well for us all got out upon foxes' side. It was clear enough. Well, every ship drew one side five on the other to pit between us.<|im_end|>", -0.45566949248313904, -0.7695098519325256, "darting furious glances behind them one thing i observed which looked well for us they all got out upon the opposite side from silver well there we stood two on one side five on the other the pit between us"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>darting furious glances about one thing I am certain, which looked well for us, they all got out of our plots and sawdust in a secure way well every stroke drew upon one side five on the other the pit being full as<|im_end|>", -0.4559590816497803, -0.7705084681510925, "darting furious glances behind them one thing i observed which looked well for us they all got out upon the opposite side from silver well there we stood two on one side five on the other the pit between us"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Darting furious glances about them one thing I am certain which looked well for us all got out a long cloth and sat in the middle of it well there we stood two on one side, five on the other with a picnic box<|im_end|>", -0.2022235095500946, 0.10450240224599838, "darting furious glances behind them one thing i observed which looked well for us they all got out upon the opposite side from silver well there we stood two on one side five on the other the pit between us"], ["15", 
"<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>darted furious glances about them one thing I am certain which looked well for us all got out along tops and sides of this hill well there we stood two on one side five on the other to pick between us<|im_end|>", 0.12362368404865265, 1.2281913757324219, "darting furious glances behind them one thing i observed which looked well for us they all got out upon the opposite side from silver well there we stood two on one side five on the other the pit between us"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I would have cherished you with all my heart, said Peterloo as we might be separated to a citizen of another world. But let's converse with regard to those who have grown up in another land and who soon after arriving here are engaged in our service.<|im_end|>", -0.25535303354263306, -0.2316378802061081, "are both opposed to the formation of such views and habits as we think desirable to the citizen of the new world we answer first with regard to those who have grown up in another land and who soon after arriving here are engaged in our service"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Are both of a distinguished and noble descent in these islands, as we might be said to be citizens of every world. 
The next verse is with regard to those who have grown up in another land and who soon after arriving here are engaged in our service.<|im_end|>", -0.19704824686050415, 0.17174986004829407, "are both opposed to the formation of such views and habits as we think desirable to the citizen of the new world we answer first with regard to those who have grown up in another land and who soon after arriving here are engaged in our service"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Our brother ships should be called in such cases as these and matters, as we might consider them to a citizen of your own world, events of personal regard to those who have grown up in another land and who soon after arriving here are engaged in our service.<|im_end|>", -0.29079490900039673, -0.47684618830680847, "are both opposed to the formation of such views and habits as we think desirable to the citizen of the new world we answer first with regard to those who have grown up in another land and who soon after arriving here are engaged in our service"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Our brothers, who have gone before us into these lands, as we might consider him to be a citizen of our own world. 
The next verse with regard to those who have grown up in another land and who soon after arriving here are engaged in our service.<|im_end|>", -0.3025875687599182, -0.5584349632263184, "are both opposed to the formation of such views and habits as we think desirable to the citizen of the new world we answer first with regard to those who have grown up in another land and who soon after arriving here are engaged in our service"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Our obligations to your royal majesty extend to these premises as we might be said to have to a citizen of the old world in answer first with regard to those who have grown up in another land and who soon after arriving here are engaged in our service.<|im_end|>", -0.027638815343379974, 1.3438266515731812, "are both opposed to the formation of such views and habits as we think desirable to the citizen of the new world we answer first with regard to those who have grown up in another land and who soon after arriving here are engaged in our service"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Are both distinguished by their voluntary services to these islands, as we might be said of him who is a citizen of every world. 
The next reverse with regard to those who have grown up in another land and who soon after arriving here are engaged in our service.<|im_end|>", -0.32690533995628357, -0.7266799807548523, "are both opposed to the formation of such views and habits as we think desirable to the citizen of the new world we answer first with regard to those who have grown up in another land and who soon after arriving here are engaged in our service"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Are of a special duty of honour and respect to these inhabitants, as we might consider him to be a citizen of their own world. The next in personal regard to those who have grown up in another land, and who soon after arriving here are engaged in our service.<|im_end|>", -0.4352739751338959, -1.4764397144317627, "are both opposed to the formation of such views and habits as we think desirable to the citizen of the new world we answer first with regard to those who have grown up in another land and who soon after arriving here are engaged in our service"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Are of a just and good moral disposition, as we might conceive them to be citizens of our own world. 
They answer first with regard to those who have grown up in another land and who, soon after arriving here, are engaged in our service.<|im_end|>", -0.22580717504024506, -0.027221782132983208, "are both opposed to the formation of such views and habits as we think desirable to the citizen of the new world we answer first with regard to those who have grown up in another land and who soon after arriving here are engaged in our service"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Our brothers, who have fallen in service to these commandments as we might consider them to a citizen of our own land, and answer first with regard to those who have grown up in another land and who soon after arriving here are engaged in our service.<|im_end|>", -0.11624263226985931, 0.7308119535446167, "are both opposed to the formation of such views and habits as we think desirable to the citizen of the new world we answer first with regard to those who have grown up in another land and who soon after arriving here are engaged in our service"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Above which we have formed ourselves these premises as we might consider them to a citizen of the whole world, and answer first with regard to those who have grown up in another land and who soon after arriving here are engaged in our service.<|im_end|>", -0.029811272397637367, 1.3287962675094604, "are both opposed to the formation of such views and habits as we think desirable to the citizen of the new world we answer first with regard to those who have grown up in another land and who soon after arriving here are engaged in our service"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Our obligations to the colonies of these islands, as we might consider them to a citizen 
of our own world, increase in force with regard to those who have grown up in another land and who soon after arriving here are engaged in our service.<|im_end|>", -0.03507249057292938, 1.292396068572998, "are both opposed to the formation of such views and habits as we think desirable to the citizen of the new world we answer first with regard to those who have grown up in another land and who soon after arriving here are engaged in our service"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Our brotherhood should be formed in such a way as to these matters, as we might conceive it were to a citizen of our own country. The next verse with regard to those who have grown up in another land and who soon after arriving here are engaged in our service.<|im_end|>", -0.4199356734752655, -1.3703200817108154, "are both opposed to the formation of such views and habits as we think desirable to the citizen of the new world we answer first with regard to those who have grown up in another land and who soon after arriving here are engaged in our service"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For seeing my weakly temper, said missus clark's manager of her daughter ashamed that she helped hide the poverty of her child in all the grand qualities which she herself possessed unconsciously and which she set so high a value upon with others.<|im_end|>", 0.046360768377780914, 0.4103975296020508, "which the uneasy tenderness of missus thornton's manner to her daughter the shame with which she thought to hide the poverty of her child in all the grand qualities which she herself possessed unconsciously and which she set so high a value upon in others"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For steam, with easy tenderness said missus sloan's 
manager of her daughter ashamed that she helped hide the poverty of her child in all the grander qualities which she herself possessed unconsciously and which she set so high a value upon with others.<|im_end|>", 0.05154683068394661, 0.44836360216140747, "which the uneasy tenderness of missus thornton's manner to her daughter the shame with which she thought to hide the poverty of her child in all the grand qualities which she herself possessed unconsciously and which she set so high a value upon in others"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For seeing my really tender and sympathetic ways of managing her daughter, ashamed that she helped to hide the poverty of her child in all the grander qualities which she herself possessed unconsciously and which she set so high a value upon with others.<|im_end|>", -0.11499068140983582, -0.7708224654197693, "which the uneasy tenderness of missus thornton's manner to her daughter the shame with which she thought to hide the poverty of her child in all the grand qualities which she herself possessed unconsciously and which she set so high a value upon in others"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For Stephen, easily tender said missus holmes managed her daughter ashamed that she helped to hide the poverty of her child in all the grander qualities which she herself possessed unconsciously and which she set so high a value upon with others.<|im_end|>", 0.10173752903938293, 0.8157991170883179, "which the uneasy tenderness of missus thornton's manner to her daughter the shame with which she thought to hide the poverty of her child in all the grand qualities which she herself possessed unconsciously and which she set so high a value upon in others"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language 
English<asr_text>for she had a really tender sense of missus holmes's management of her daughter ashamed that she helped to hide the poverty of her child in all the grander qualities which she herself possessed unconsciously and which she set so high a value upon with others<|im_end|>", 0.06310267001390457, 0.5329614281654358, "which the uneasy tenderness of missus thornton's manner to her daughter the shame with which she thought to hide the poverty of her child in all the grand qualities which she herself possessed unconsciously and which she set so high a value upon in others"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For seeing my really tender, said missus clark's manner to her daughter the shame with which she helped hide the poverty of her child in all the grander qualities that she herself possessed unconsciously and which she set so high a value upon with others.<|im_end|>", 0.2842099964618683, 2.151641607284546, "which the uneasy tenderness of missus thornton's manner to her daughter the shame with which she thought to hide the poverty of her child in all the grand qualities which she herself possessed unconsciously and which she set so high a value upon in others"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For she had a really tenderness of disposition and management for her daughter, ashamed that she helped to hide the poverty of her child in all the grand qualities which she herself possessed unconsciously, and which she set so high a value upon with others.<|im_end|>", -0.01078671682626009, -0.007967192679643631, "which the uneasy tenderness of missus thornton's manner to her daughter the shame with which she thought to hide the poverty of her child in all the grand qualities which she herself possessed unconsciously and which she set so high a value upon in others"], ["15", 
"<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For she had a really tender sense of Mrs holmes's management of her daughter, ashamed that she helped to hide the poverty of her child in all the grand qualities which she herself possessed unconsciously and which she set so high a value upon with others.<|im_end|>", -0.11140192300081253, -0.7445499300956726, "which the uneasy tenderness of missus thornton's manner to her daughter the shame with which she thought to hide the poverty of her child in all the grand qualities which she herself possessed unconsciously and which she set so high a value upon in others"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For she had a really tender sense of mrs fleming's management of her daughter, ashamed that she helped to hide the poverty of her child in all the grander qualities which she herself possessed unconsciously and which she set so high a value upon with others.<|im_end|>", -0.18237683176994324, -1.2641422748565674, "which the uneasy tenderness of missus thornton's manner to her daughter the shame with which she thought to hide the poverty of her child in all the grand qualities which she herself possessed unconsciously and which she set so high a value upon in others"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For steam and breathing temperance said missus fleming's manager her daughter ashamed that she helped hide the poverty of her child in all the grander qualities which she herself possessed unconsciously at first she set so high a value upon the pleasures<|box_start|><|im_end|>", -0.16693364083766937, -1.1510859727859497, "which the uneasy tenderness of missus thornton's manner to her daughter the shame with which she thought to hide the poverty of her child in all the grand qualities 
which she herself possessed unconsciously and which she set so high a value upon in others"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For she had a pleasing temper, said missus holmes's manager of her daughter, ashamed that she helped to hide the poverty of her child in all the grander qualities which she herself possessed unconsciously and which she set so high a value upon with others.<|im_end|>", -0.12878626585006714, -0.8718170523643494, "which the uneasy tenderness of missus thornton's manner to her daughter the shame with which she thought to hide the poverty of her child in all the grand qualities which she herself possessed unconsciously and which she set so high a value upon in others"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For she had a pleasing temper, said missus holmes's manager of her daughter ashamed that she helped to hide the poverty of her child in all the grand qualities which she herself possessed unconsciously and which she set so high a value upon with others.<|im_end|>", 0.05193726718425751, 0.45122188329696655, "which the uneasy tenderness of missus thornton's manner to her daughter the shame with which she thought to hide the poverty of her child in all the grand qualities which she herself possessed unconsciously and which she set so high a value upon in others"], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And had promised to enter the eternal city in my next episcopal abbatial name.<|im_end|>", -0.288534939289093, 0.34273386001586914, "And had promised to lend her the eternal city and my recipe for rabbit mayonnaise."], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And had promised to enter the eternal city in my 
nephew's behalf at mayonnaise.<|im_end|>", -0.062477611005306244, 1.5248231887817383, "And had promised to lend her the eternal city and my recipe for rabbit mayonnaise."], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And had promised to enter the eternal city in my own sepulchre, provided me a name.<|im_end|>", -0.6080390810966492, -1.3280036449432373, "And had promised to lend her the eternal city and my recipe for rabbit mayonnaise."], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And had promised to enter the eternal city and martyrship provided me a name.<|im_end|>", -0.28105244040489197, 0.38186103105545044, "And had promised to lend her the eternal city and my recipe for rabbit mayonnaise."], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And had promised to enter the eternal city in my embassy provided me a name.<|im_end|>", -0.4495788514614105, -0.4993901252746582, "And had promised to lend her the eternal city and my recipe for rabbit mayonnaise."], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And had promised to enter the eternal city in my nephew's behalf at mayonnaise.<|im_end|>", -0.062477611005306244, 1.5248231887817383, "And had promised to lend her the eternal city and my recipe for rabbit mayonnaise."], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And had promised to enter the eternal city and martyrship provided me a name.<|im_end|>", -0.28105244040489197, 0.38186103105545044, "And had promised to lend her the eternal city and my recipe for rabbit mayonnaise."], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language 
English<asr_text>And had promised to enter the eternal city in my next episcopal visit made there.<|im_end|>", -0.4480052590370178, -0.4911615550518036, "And had promised to lend her the eternal city and my recipe for rabbit mayonnaise."], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And had promised to enter the eternal city and martyrship provided me a name.<|im_end|>", -0.28105244040489197, 0.38186103105545044, "And had promised to lend her the eternal city and my recipe for rabbit mayonnaise."], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And had promised to enter the eternal city in my next epistle that it may remain.<|im_end|>", -0.6017347574234009, -1.2950372695922852, "And had promised to lend her the eternal city and my recipe for rabbit mayonnaise."], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And had promised to enter the eternal city and martyrship provided me a name.<|im_end|>", -0.28105244040489197, 0.38186103105545044, "And had promised to lend her the eternal city and my recipe for rabbit mayonnaise."], ["15", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And had promised to enter the eternal city in my nephew's behalf at many a name.<|im_end|>", -0.6038755774497986, -1.30623197555542, "And had promised to lend her the eternal city and my recipe for rabbit mayonnaise."]]}
wandb/run-20260417_123237-3h84yfea/files/media/table/completions_9_ec21142175e3781c9ddd.table.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"columns": ["step", "prompt", "completion", "ASRWerSubLenCmpHalluDirtyV56", "advantages", "solution"], "data": [["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>We looked upon them and we laughed, and said fear nothing my brothers, there is a great power in these wires but this power is tamed it is yours we give it to you still they would not move.<|im_end|>", 0.7686349749565125, 0.5085489153862, "we looked upon them and we laughed and said fear nothing our brothers there is a great power in these wires but this power is tamed it is yours we give it to you still they would not move"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>We looked upon them and we laughed, and said fear nothing my brothers there is a great power in these wires but this power is tamed it is yours we give it to you still they would not move.<|im_end|>", 0.8261563181877136, 0.8900229930877686, "we looked upon them and we laughed and said fear nothing our brothers there is a great power in these wires but this power is tamed it is yours we give it to you still they would not move"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>We looked upon them and we laughed, and said fear nothing my brothers, there is a great power in these wires, but this power is tamed. It is yours. 
We give it to you still they would not move.<|im_end|>", 0.5813714861869812, -0.7333583831787109, "we looked upon them and we laughed and said fear nothing our brothers there is a great power in these wires but this power is tamed it is yours we give it to you still they would not move"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>We looked upon them and we laughed, and said fear nothing my brothers there is a great power in these wires but this power is tamed it is yours we give it to you still they would not move.<|im_end|>", 0.8261563181877136, 0.8900229930877686, "we looked upon them and we laughed and said fear nothing our brothers there is a great power in these wires but this power is tamed it is yours we give it to you still they would not move"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>We looked upon them and we laughed, and said fear nothing my brothers there is a great power in these wires but this power is tamed it is yours we give it to you still they would not move.<|im_end|>", 0.8261563181877136, 0.8900229930877686, "we looked upon them and we laughed and said fear nothing our brothers there is a great power in these wires but this power is tamed it is yours we give it to you still they would not move"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>We looked upon them and we laughed, and said fear nothing my brothers, there is a great power in these wilds, but this power is tamed. It is yours. 
We give it to you still they would not move.<|im_end|>", 0.5788635611534119, -0.7499906420707703, "we looked upon them and we laughed and said fear nothing our brothers there is a great power in these wires but this power is tamed it is yours we give it to you still they would not move"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>We looked upon them and we laughed, and said, fear nothing, my brothers. There is a great power in these wires, but this power is tamed. It is yours. We give it to you still they would not move.<|im_end|>", 0.4414002299308777, -1.6616296768188477, "we looked upon them and we laughed and said fear nothing our brothers there is a great power in these wires but this power is tamed it is yours we give it to you still they would not move"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>We looked upon them and we laughed, and said, fear nothing my brothers, there is a great power in these wires but this power is tamed it is yours, we give it to you still they would not move.<|im_end|>", 0.6516913175582886, -0.26700636744499207, "we looked upon them and we laughed and said fear nothing our brothers there is a great power in these wires but this power is tamed it is yours we give it to you still they would not move"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>We looked upon them and we laughed, and said fear nothing my brothers there is a great power in these wires but this power is tamed it is yours we give it to you still they would not move.<|im_end|>", 0.8261563181877136, 0.8900229930877686, "we looked upon them and we laughed and said fear nothing our brothers there is a great power in these wires but this power is tamed it is yours we give it to you still they would not move"], ["20", 
"<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>We looked upon them and we laughed, and said fear nothing, my brothers, there is a great power in these wires but this power is tamed it is yours we give it to you still they would not move.<|im_end|>", 0.7117764949798584, 0.13147078454494476, "we looked upon them and we laughed and said fear nothing our brothers there is a great power in these wires but this power is tamed it is yours we give it to you still they would not move"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>We looked upon them and we laughed, and said fear nothing my brothers there is a great power in these wires but this power is tamed it is yours we give it to you still they would not move.<|im_end|>", 0.8261563181877136, 0.8900229930877686, "we looked upon them and we laughed and said fear nothing our brothers there is a great power in these wires but this power is tamed it is yours we give it to you still they would not move"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>We looked upon them and we laughed, and said, fear nothing, my brothers. There is a great power in these wilds, but this power is tamed. It is yours. 
We give it to you still they would not move.<|im_end|>", 0.43890881538391113, -1.6781524419784546, "we looked upon them and we laughed and said fear nothing our brothers there is a great power in these wires but this power is tamed it is yours we give it to you still they would not move"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At such a moment, this yet undiscovered and peculiar world was in no ordinary shape, setting in motion incalculable weapons of force and agencies for the first time man had command of his native supply of electricity without thought or effort.<|im_end|>", -0.12373896688222885, 0.08507958054542542, "at such a moment this gift of despoiled italy to the world was a noble revenge setting in motion incalculable beneficent forces and agencies for the first time man had command of a steady supply of electricity without toil or effort"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At such a moment, this yet undiscovered and peculiar world was in no words of change setting in motion incalculable weapons and forces and agencies for the first time man had command of his daily supply of electricity without trouble or effort.<|im_end|>", -0.1656464785337448, -0.35089585185050964, "at such a moment this gift of despoiled italy to the world was a noble revenge setting in motion incalculable beneficent forces and agencies for the first time man had command of a steady supply of electricity without toil or effort"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At such a moment, this yet undiscovered and peculiar world was in no ordinary shape, setting in motion incalculable weapons and forces and agencies for the first time man had command of his native supply of electricity without thought or effort.<|im_end|>", 
-0.054759737104177475, 0.8026895523071289, "at such a moment this gift of despoiled italy to the world was a noble revenge setting in motion incalculable beneficent forces and agencies for the first time man had command of a steady supply of electricity without toil or effort"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At such a moment, this yet undiscovered and peculiar world was in no ordinary chair setting in motion incalculable weapons of force and agencies for the first time man had command of his native supply of electricity without thought or effort.<|im_end|>", -0.12419147044420242, 0.08037205785512924, "at such a moment this gift of despoiled italy to the world was a noble revenge setting in motion incalculable beneficent forces and agencies for the first time man had command of a steady supply of electricity without toil or effort"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At such a moment, this yet undiscovered and peculiar world was in no way diminished, setting in motion incalculable weapons and forces and agencies for the first time man had command of his daily supply of electricity without thought or effort.<|im_end|>", -0.05371581390500069, 0.8135498762130737, "at such a moment this gift of despoiled italy to the world was a noble revenge setting in motion incalculable beneficent forces and agencies for the first time man had command of a steady supply of electricity without toil or effort"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At such a moment, this yet undiscovered and peculiar world was in no little danger, setting in motion incalculable weapons of force and agencies for the first time man had command over things supplied with electricity without thought or effort.<|im_end|>", -0.3379965126514435, 
-2.1439008712768555, "at such a moment this gift of despoiled italy to the world was a noble revenge setting in motion incalculable beneficent forces and agencies for the first time man had command of a steady supply of electricity without toil or effort"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At such a moment, this vehicle of the mechanical world was in no other language setting in motion incalculable weapons and forces and agencies for the first time man had command of his native supply of electricity without thought or effort.<|im_end|>", 0.018295863643288612, 1.5627073049545288, "at such a moment this gift of despoiled italy to the world was a noble revenge setting in motion incalculable beneficent forces and agencies for the first time man had command of a steady supply of electricity without toil or effort"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At such a moment, this yet undiscovered and peculiar world was in no ordinary shape, setting in motion incalculable weapons of force and agencies for the first time man had command of his native supply of electricity without thought or effort.<|im_end|>", -0.12373896688222885, 0.08507958054542542, "at such a moment this gift of despoiled italy to the world was a noble revenge setting in motion incalculable beneficent forces and agencies for the first time man had command of a steady supply of electricity without toil or effort"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At such a moment, this yet undiscovered and familiar world was in no ordinary shape, setting in motion incalculable weapons of force and agencies. 
For the first time man had command of his daily supply of electricity without trouble or effort.<|im_end|>", -0.19637031853199005, -0.6705244779586792, "at such a moment this gift of despoiled italy to the world was a noble revenge setting in motion incalculable beneficent forces and agencies for the first time man had command of a steady supply of electricity without toil or effort"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At such a moment, this yet undiscovered and familiar world was in no ordinary shape, setting in motion incalculable weapons and forces and agencies for the first time man had command of his native supply of electricity without thought or effort.<|im_end|>", -0.053767330944538116, 0.8130138516426086, "at such a moment this gift of despoiled italy to the world was a noble revenge setting in motion incalculable beneficent forces and agencies for the first time man had command of a steady supply of electricity without toil or effort"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At such a moment, this yet undiscovered and peculiar world was in no ordinary shape setting in motion incalculable weapons of force and agencies for the first time man had command of his native supply of electricity without thought or effort.<|im_end|>", -0.12297827005386353, 0.09299331903457642, "at such a moment this gift of despoiled italy to the world was a noble revenge setting in motion incalculable beneficent forces and agencies for the first time man had command of a steady supply of electricity without toil or effort"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At such a moment, this yet undiscovered and familiar world was in no word of language setting in motion incalculable weapons of force and agencies for the first time 
man had command of his native supply of electricity without thought or effort.<|im_end|>", -0.24439725279808044, -1.1701619625091553, "at such a moment this gift of despoiled italy to the world was a noble revenge setting in motion incalculable beneficent forces and agencies for the first time man had command of a steady supply of electricity without toil or effort"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He repeated and they're dashed out of the turnpike splendid span black horses attached to a carriage having long run s r s in gilt letters on the fender at the door two girls stepped up in the car with the carriage the old woman had entered and taken her seat<|im_end|>", 0.19381928443908691, 0.380490243434906, "he repeated and there dashed up to the curb a splendid span of black horses attached to a carriage having the monogram c r s in gilt letters on the panel of the door two girls stepped out of the crowd towards the carriage the older one had entered and taken her seat"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He repeated, and there dashed out of the nursery a splendid span black horses attached to a carriage having long written c r s in gilt letters on the handle of that order two girls stepped out at the car window with the carriage, the old woman had entered and taken her seat.<|im_end|>", 0.14365018904209137, -0.12923574447631836, "he repeated and there dashed up to the curb a splendid span of black horses attached to a carriage having the monogram c r s in gilt letters on the panel of the door two girls stepped out of the crowd towards the carriage the older one had entered and taken her seat"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He repeated, and there dashed after them a splendid span of black horses 
attached to a carriage having long written c r s in gilt letters on the fanlight door two girls stepped out at the front door with the carriage. The old woman had entered, taken her seat.<|im_end|>", 0.05467502027750015, -1.0332376956939697, "he repeated and there dashed up to the curb a splendid span of black horses attached to a carriage having the monogram c r s in gilt letters on the panel of the door two girls stepped out of the crowd towards the carriage the older one had entered and taken her seat"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He repeated and they're dashed out into the nursery as a splendid span of black horses attached to a carriage having long running c r s in gilt letters on the fender at the door two girls stepped out of the car with the carriage, the old woman had entered and taken her seat.<|im_end|>", 0.294100284576416, 1.399361252784729, "he repeated and there dashed up to the curb a splendid span of black horses attached to a carriage having the monogram c r s in gilt letters on the panel of the door two girls stepped out of the crowd towards the carriage the older one had entered and taken her seat"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He repeated and they're dashed out of the nursery a splendid span black horses attached to a carriage having long running c r s in gilt letters on the front of that order two girls stepped up into the crowded rear of the carriage, the old woman had entered taking her seat.<|im_end|>", -0.00651371106505394, -1.654924988746643, "he repeated and there dashed up to the curb a splendid span of black horses attached to a carriage having the monogram c r s in gilt letters on the panel of the door two girls stepped out of the crowd towards the carriage the older one had entered and taken her seat"], ["20", 
"<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He repeated, and there dashed out through the nursery a splendid span of black horses attached to a carriage having long red c r s in gilt letters on the handle at the door. Two girls stepped up to the carriageway with the carriage. The old woman had entered and taken her seat.<|im_end|>", 0.1829727590084076, 0.2702878415584564, "he repeated and there dashed up to the curb a splendid span of black horses attached to a carriage having the monogram c r s in gilt letters on the panel of the door two girls stepped out of the crowd towards the carriage the older one had entered and taken her seat"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He repeated, and they're dashed up through the turnpike splendid span of black horses attached to a carriage having long running c r s in gilt letters on the fan of that order two girls stepped out into the crowd towards the carriage, the old woman had entered and taken her seat.<|im_end|>", 0.2951398491859436, 1.4099233150482178, "he repeated and there dashed up to the curb a splendid span of black horses attached to a carriage having the monogram c r s in gilt letters on the panel of the door two girls stepped out of the crowd towards the carriage the older one had entered and taken her seat"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He repeated and they're dashed out into the nursery, a splendid span of black horses attached to a carriage having long running c r s in gilt letters on the fender at the door. Two girls stepped out in the corral towards the carriage. 
The old woman had entered and taken her seat.<|im_end|>", 0.28599315881729126, 1.3169915676116943, "he repeated and there dashed up to the curb a splendid span of black horses attached to a carriage having the monogram c r s in gilt letters on the panel of the door two girls stepped out of the crowd towards the carriage the older one had entered and taken her seat"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He repeated, and there dashed out of the nursery a splendid span of black horses attached to a carriage having long running s r s in gilt letters on the front of that order two girls stepped up into the rear end of the carriage, the old woman had entered and taken her seat.<|im_end|>", 0.08877895027399063, -0.6867362856864929, "he repeated and there dashed up to the curb a splendid span of black horses attached to a carriage having the monogram c r s in gilt letters on the panel of the door two girls stepped out of the crowd towards the carriage the older one had entered and taken her seat"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He repeated, and there dashed out of the nursery a splendid span black horses attached to a carriage having on the bonnet c r s in gilt letters on a fan flap door two girls stepped up to the crowd around the carriage. 
The old woman had entered and taken her seat.<|im_end|>", 0.15423451364040375, -0.021697325631976128, "he repeated and there dashed up to the curb a splendid span of black horses attached to a carriage having the monogram c r s in gilt letters on the panel of the door two girls stepped out of the crowd towards the carriage the older one had entered and taken her seat"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He repeated and they're dashed out of the nursery with a splendid span of black horses attached to a carriage having long running c r s in gilt letters on the front of that order two girls stepped up at the garaband door of the carriage, the old woman had entered and taken her seat.<|im_end|>", 0.09735386073589325, -0.5996138453483582, "he repeated and there dashed up to the curb a splendid span of black horses attached to a carriage having the monogram c r s in gilt letters on the panel of the door two girls stepped out of the crowd towards the carriage the older one had entered and taken her seat"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He repeated and they're dashed out of the nursery, splendid span black horses attached to a carriage having long running c r s in gilt letters on the fan flap door two girls stepped up into the carriagewith the old woman had entered and taken her seat<|im_end|>", 0.09223616868257523, -0.6516103744506836, "he repeated and there dashed up to the curb a splendid span of black horses attached to a carriage having the monogram c r s in gilt letters on the panel of the door two girls stepped out of the crowd towards the carriage the older one had entered and taken her seat"], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The young inventor turned his face aside and then glanced round the 
dark barn in alarm. The cat pushed out from behind him with a great low paw between its jaws, and it was ugly. Sh sh said a low murmur of whisper.<|im_end|>", -1.1028889417648315, -0.7121061682701111, "They looked into each other's frightened faces, and then glanced around the dark barn in alarm. An old cap pushed up through the hay. Then a weak little cough betrayed jonesy. He had followed them. Sh he said in a warning whisper."], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And looked into each other's frightened faces, and then glanced round the dark barn in alarm. He pushed up his collar with a great low cough between jerks of breath, and held out his hand. Sh sh said an old woman whispering.<|im_end|>", -0.6284806728363037, 1.885280966758728, "They looked into each other's frightened faces, and then glanced around the dark barn in alarm. An old cap pushed up through the hay. Then a weak little cough betrayed jonesy. He had followed them. Sh he said in a warning whisper."], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Then he leaned over to his sister, and they kissed again, and then glanced round the dark barn in the mar. Cuthbert's head fell, and a great blow passed between them. And it was heavy, sh she said aloud with a whisper.<|im_end|>", -1.1564602851867676, -1.0054094791412354, "They looked into each other's frightened faces, and then glanced around the dark barn in alarm. An old cap pushed up through the hay. Then a weak little cough betrayed jonesy. He had followed them. Sh he said in a warning whisper."], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The little angel just stared at his feet, and then glanced round the dark barn in alarm. 
He pushed up his heels with a great blow, caught betwixt arm and leg, and had hardly been shuffling on the floor when he whispered.<|im_end|>", -1.1646636724472046, -1.0503231287002563, "They looked into each other's frightened faces, and then glanced around the dark barn in alarm. An old cap pushed up through the hay. Then a weak little cough betrayed jonesy. He had followed them. Sh he said in a warning whisper."], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The little angel touched his great white face and then glanced round the dark barn in alarm, pushed up from under it with a great blow of paws that dragged him back again. And he had said something sh she flamed out a whisper.<|im_end|>", -1.1615231037139893, -1.0331284999847412, "They looked into each other's frightened faces, and then glanced around the dark barn in alarm. An old cap pushed up through the hay. Then a weak little cough betrayed jonesy. He had followed them. Sh he said in a warning whisper."], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Then he looked into each of the three faces and then glanced round the dark barn in alarm, pushed out his head and with great little hops retreated joyfully away from the room sh she said a murmur whispered.<|im_end|>", -0.9255474805831909, 0.2588390111923218, "They looked into each other's frightened faces, and then glanced around the dark barn in alarm. An old cap pushed up through the hay. Then a weak little cough betrayed jonesy. He had followed them. Sh he said in a warning whisper."], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The little angel just stared at his hand and then glanced round the dark barn in alarm, pushed up her hood and a great low cough betrayed joy and fear. 
Sh sh sh said another voice.<|im_end|>", -0.9503790140151978, 0.12288626283407211, "They looked into each other's frightened faces, and then glanced around the dark barn in alarm. An old cap pushed up through the hay. Then a weak little cough betrayed jonesy. He had followed them. Sh he said in a warning whisper."], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And looked into each other's frightened faces, and then glanced round the dark barn in alarm. Pritchett quickly hid his great blue paws between his arms, and he did a little bit sh sh said a low voice.<|im_end|>", -0.6836804151535034, 1.5830621719360352, "They looked into each other's frightened faces, and then glanced around the dark barn in alarm. An old cap pushed up through the hay. Then a weak little cough betrayed jonesy. He had followed them. Sh he said in a warning whisper."], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And looking down at his frightened face, and then glanced round the dark barn in alarm. He pushed up slowly from a great low cask between two walls and looked wildly around him. Sh said another voice.<|im_end|>", -0.9896582961082458, -0.09216795861721039, "They looked into each other's frightened faces, and then glanced around the dark barn in alarm. An old cap pushed up through the hay. Then a weak little cough betrayed jonesy. He had followed them. Sh he said in a warning whisper."], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The little angel just stared at her and then glanced round the dark barn in alarm, but pushed up quickly when a great blow passed between the two men. 
And it was somebody sh said another voice.<|im_end|>", -1.0897308588027954, -0.640065610408783, "They looked into each other's frightened faces, and then glanced around the dark barn in alarm. An old cap pushed up through the hay. Then a weak little cough betrayed jonesy. He had followed them. Sh he said in a warning whisper."], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And looked into each of the great windows, and then glanced round the dark barn in the yard. He pushed up his sleeve, and with a great low cough betrayed joy, and asked happily shh, said another voice quietly.<|im_end|>", -0.8186123371124268, 0.8443093299865723, "They looked into each other's frightened faces, and then glanced around the dark barn in alarm. An old cap pushed up through the hay. Then a weak little cough betrayed jonesy. He had followed them. Sh he said in a warning whisper."], ["20", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And looking down at his frightened face again, and then glanced round the dark barn in alarm. He pushed up slowly from the great low cask between two old men. And he saw a blue moon sh she said no one whispered.<|im_end|>", -1.0022618770599365, -0.16117261350154877, "They looked into each other's frightened faces, and then glanced around the dark barn in alarm. An old cap pushed up through the hay. Then a weak little cough betrayed jonesy. He had followed them. Sh he said in a warning whisper."]]}
wandb/run-20260417_123237-3h84yfea/files/output.log ADDED
@@ -0,0 +1,326 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ wandb: Detected [openai] in use.
2
+ wandb: Use W&B Weave for improved LLM call tracing. Install Weave with `pip install weave` then add `import weave` to the top of your script.
3
+ wandb: For more information, check out the docs at: https://weave-docs.wandb.ai/
4
+ Train: 0%| | 0/9327 [00:00<?, ?it/s]Could not estimate the number of tokens of the input, floating-point operations will not be computed
5
+ [DEBUG generate] shape= (24, 245) last_col_pad_cnt= 0 first_col_pad_cnt= 12
6
+ [DEBUG _encode] has_resp= True prompt_len= 245 resp_len= 53 full_len= 298 label_non_ignore= 53
7
+ [DEBUG _encode] has_resp= True prompt_len= 245 resp_len= 56 full_len= 301 label_non_ignore= 56
8
+ [DEBUG _encode] has_resp= True prompt_len= 245 resp_len= 52 full_len= 297 label_non_ignore= 52
9
+ [DEBUG _encode] has_resp= True prompt_len= 245 resp_len= 53 full_len= 298 label_non_ignore= 53
10
+ [DEBUG _encode] has_resp= True prompt_len= 245 resp_len= 58 full_len= 303 label_non_ignore= 58
11
+ [DEBUG _encode] has_resp= True prompt_len= 245 resp_len= 55 full_len= 300 label_non_ignore= 55
12
+ [DEBUG _encode] has_resp= True prompt_len= 245 resp_len= 56 full_len= 301 label_non_ignore= 56
13
+ [DEBUG _encode] has_resp= True prompt_len= 245 resp_len= 61 full_len= 306 label_non_ignore= 61
14
+ [DEBUG _encode] has_resp= True prompt_len= 245 resp_len= 55 full_len= 300 label_non_ignore= 55
15
+ [DEBUG _encode] has_resp= True prompt_len= 245 resp_len= 50 full_len= 295 label_non_ignore= 50
16
+ [DEBUG generate] shape= (24, 245) last_col_pad_cnt= 0 first_col_pad_cnt= 12
17
+ [DEBUG generate] shape= (24, 235) last_col_pad_cnt= 0 first_col_pad_cnt= 12
18
+ [DEBUG generate] shape= (24, 235) last_col_pad_cnt= 0 first_col_pad_cnt= 12
19
+ [DEBUG generate] shape= (24, 249) last_col_pad_cnt= 0 first_col_pad_cnt= 12
20
+ Train: 0%| | 8/9327 [07:40<146:43:24, 56.68s/it]
21
+ {'loss': 0.00064715, 'grad_norm': 0.43327886, 'learning_rate': 1.8e-07, 'completions/mean_length': 48.90104294, 'completions/min_length': 35.25, 'completions/max_length': 61.25, 'completions/clipped_ratio': 0.0, 'reward': -0.42871299, 'reward_std': 0.16135792, 'frac_reward_zero_std': 0.0, 'rewards/ASRWerSubLenCmpHalluDirtyV56/mean': -0.42871299, 'rewards/ASRWerSubLenCmpHalluDirtyV56/std': 0.28526043, 'kl': 0.0, 'clip_ratio/low_mean': 0.0, 'clip_ratio/low_min': 0.0, 'clip_ratio/high_mean': 0.0, 'clip_ratio/high_max': 0.0, 'clip_ratio/region_mean': 0.0, 'step_time': 32.50056268, 'epoch': 0.0, 'global_step/max_steps': '1/9327', 'elapsed_time': '1m 5s', 'remaining_time': '7d 1h 23m 55s', 'memory(GiB)': 7.93, 'train_speed(s/it)': 65.390893}
22
+ [DEBUG generate] shape= (24, 250) last_col_pad_cnt= 0 first_col_pad_cnt= 0
23
+ [DEBUG generate] shape= (24, 250) last_col_pad_cnt= 0 first_col_pad_cnt= 0
24
+ [DEBUG generate] shape= (24, 226) last_col_pad_cnt= 0 first_col_pad_cnt= 12
25
+ [DEBUG generate] shape= (24, 226) last_col_pad_cnt= 0 first_col_pad_cnt= 12
26
+ [DEBUG generate] shape= (24, 249) last_col_pad_cnt= 0 first_col_pad_cnt= 12
27
+ [DEBUG generate] shape= (24, 249) last_col_pad_cnt= 0 first_col_pad_cnt= 12
28
+ [DEBUG generate] shape= (24, 255) last_col_pad_cnt= 0 first_col_pad_cnt= 12
29
+ [DEBUG generate] shape= (24, 255) last_col_pad_cnt= 0 first_col_pad_cnt= 12
30
+ [DEBUG generate] shape= (24, 257) last_col_pad_cnt= 0 first_col_pad_cnt= 12
31
+ [DEBUG generate] shape= (24, 257) last_col_pad_cnt= 0 first_col_pad_cnt= 12
32
+ [DEBUG generate] shape= (24, 244) last_col_pad_cnt= 0 first_col_pad_cnt= 12
33
+ [DEBUG generate] shape= (24, 244) last_col_pad_cnt= 0 first_col_pad_cnt= 12
34
+ [DEBUG generate] shape= (24, 253) last_col_pad_cnt= 0 first_col_pad_cnt= 12
35
+ [DEBUG generate] shape= (24, 253) last_col_pad_cnt= 0 first_col_pad_cnt= 12
36
+ [DEBUG generate] shape= (24, 254) last_col_pad_cnt= 0 first_col_pad_cnt= 12
37
+ [DEBUG generate] shape= (24, 254) last_col_pad_cnt= 0 first_col_pad_cnt= 12
38
+ {'loss': 0.00332408, 'grad_norm': 0.37274894, 'learning_rate': 8.9e-07, 'completions/mean_length': 51.19921994, 'completions/min_length': 34.0, 'completions/max_length': 64.6875, 'completions/clipped_ratio': 0.0, 'reward': -0.02796031, 'reward_std': 0.15601904, 'frac_reward_zero_std': 0.0, 'rewards/ASRWerSubLenCmpHalluDirtyV56/mean': -0.02796032, 'rewards/ASRWerSubLenCmpHalluDirtyV56/std': 0.3970435, 'kl': 0.00452624, 'clip_ratio/low_mean': 0.01082122, 'clip_ratio/low_min': 0.0055485, 'clip_ratio/high_mean': 0.00634016, 'clip_ratio/high_max': 0.0085038, 'clip_ratio/region_mean': 0.01716138, 'step_time': 27.27283109, 'epoch': 0.0, 'global_step/max_steps': '5/9327', 'elapsed_time': '4m 49s', 'remaining_time': '6d 5h 27m 51s', 'memory(GiB)': 8.23, 'train_speed(s/it)': 57.720515}
39
+ [DEBUG generate] shape= (24, 256) last_col_pad_cnt= 0 first_col_pad_cnt= 12
40
+ [DEBUG generate] shape= (24, 256) last_col_pad_cnt= 0 first_col_pad_cnt= 12
41
+ [DEBUG generate] shape= (24, 246) last_col_pad_cnt= 0 first_col_pad_cnt= 12
42
+ [DEBUG generate] shape= (24, 246) last_col_pad_cnt= 0 first_col_pad_cnt= 12
43
+ [DEBUG generate] shape= (24, 135) last_col_pad_cnt= 0 first_col_pad_cnt= 12
44
+ [DEBUG generate] shape= (24, 135) last_col_pad_cnt= 0 first_col_pad_cnt= 12
45
+ [DEBUG generate] shape= (24, 225) last_col_pad_cnt= 0 first_col_pad_cnt= 12
46
+ [DEBUG generate] shape= (24, 225) last_col_pad_cnt= 0 first_col_pad_cnt= 12
47
+ [DEBUG generate] shape= (24, 244) last_col_pad_cnt= 0 first_col_pad_cnt= 0
48
+ [DEBUG generate] shape= (24, 244) last_col_pad_cnt= 0 first_col_pad_cnt= 0
49
+ [DEBUG generate] shape= (24, 240) last_col_pad_cnt= 0 first_col_pad_cnt= 12
50
+ [DEBUG generate] shape= (24, 240) last_col_pad_cnt= 0 first_col_pad_cnt= 12
51
+ [DEBUG generate] shape= (24, 244) last_col_pad_cnt= 0 first_col_pad_cnt= 12
52
+ [DEBUG generate] shape= (24, 244) last_col_pad_cnt= 0 first_col_pad_cnt= 12
53
+ [DEBUG generate] shape= (24, 246) last_col_pad_cnt= 0 first_col_pad_cnt= 12
54
+ [DEBUG generate] shape= (24, 246) last_col_pad_cnt= 0 first_col_pad_cnt= 12
55
+ [DEBUG generate] shape= (24, 236) last_col_pad_cnt= 0 first_col_pad_cnt= 12
56
+ [DEBUG generate] shape= (24, 236) last_col_pad_cnt= 0 first_col_pad_cnt= 12
57
+ [DEBUG generate] shape= (24, 238) last_col_pad_cnt= 0 first_col_pad_cnt= 12
58
+ [DEBUG generate] shape= (24, 238) last_col_pad_cnt= 0 first_col_pad_cnt= 12
59
+ {'loss': 0.00474931, 'grad_norm': 0.40048897, 'learning_rate': 1.79e-06, 'completions/mean_length': 51.25104275, 'completions/min_length': 35.8, 'completions/max_length': 65.4, 'completions/clipped_ratio': 0.0, 'reward': -0.01675091, 'reward_std': 0.17052342, 'frac_reward_zero_std': 0.0, 'rewards/ASRWerSubLenCmpHalluDirtyV56/mean': -0.0167509, 'rewards/ASRWerSubLenCmpHalluDirtyV56/std': 0.47662268, 'kl': 0.00584314, 'clip_ratio/low_mean': 0.0141277, 'clip_ratio/low_min': 0.0085519, 'clip_ratio/high_mean': 0.00913547, 'clip_ratio/high_max': 0.01304741, 'clip_ratio/region_mean': 0.02326317, 'step_time': 27.57334645, 'epoch': 0.0, 'global_step/max_steps': '10/9327', 'elapsed_time': '9m 28s', 'remaining_time': '6d 2h 53m 31s', 'memory(GiB)': 8.23, 'train_speed(s/it)': 56.757666}
60
+ [DEBUG generate] shape= (24, 242) last_col_pad_cnt= 0 first_col_pad_cnt= 12
61
+ [DEBUG generate] shape= (24, 242) last_col_pad_cnt= 0 first_col_pad_cnt= 12
62
+ [DEBUG generate] shape= (24, 241) last_col_pad_cnt= 0 first_col_pad_cnt= 0
63
+ [DEBUG generate] shape= (24, 241) last_col_pad_cnt= 0 first_col_pad_cnt= 0
64
+ [DEBUG generate] shape= (24, 245) last_col_pad_cnt= 0 first_col_pad_cnt= 12
65
+ [DEBUG generate] shape= (24, 245) last_col_pad_cnt= 0 first_col_pad_cnt= 12
66
+ [DEBUG generate] shape= (24, 246) last_col_pad_cnt= 0 first_col_pad_cnt= 12
67
+ [DEBUG generate] shape= (24, 246) last_col_pad_cnt= 0 first_col_pad_cnt= 12
68
+ [DEBUG generate] shape= (24, 257) last_col_pad_cnt= 0 first_col_pad_cnt= 12
69
+ [DEBUG generate] shape= (24, 257) last_col_pad_cnt= 0 first_col_pad_cnt= 12
70
+ [DEBUG generate] shape= (24, 252) last_col_pad_cnt= 0 first_col_pad_cnt= 12
71
+ [DEBUG generate] shape= (24, 252) last_col_pad_cnt= 0 first_col_pad_cnt= 12
72
+ [DEBUG generate] shape= (24, 248) last_col_pad_cnt= 0 first_col_pad_cnt= 12
73
+ [DEBUG generate] shape= (24, 248) last_col_pad_cnt= 0 first_col_pad_cnt= 12
74
+ [DEBUG generate] shape= (24, 239) last_col_pad_cnt= 0 first_col_pad_cnt= 12
75
+ [DEBUG generate] shape= (24, 239) last_col_pad_cnt= 0 first_col_pad_cnt= 12
76
+ [DEBUG generate] shape= (24, 247) last_col_pad_cnt= 0 first_col_pad_cnt= 12
77
+ [DEBUG generate] shape= (24, 247) last_col_pad_cnt= 0 first_col_pad_cnt= 12
78
+ [DEBUG generate] shape= (24, 246) last_col_pad_cnt= 0 first_col_pad_cnt= 0
79
+ [DEBUG generate] shape= (24, 246) last_col_pad_cnt= 0 first_col_pad_cnt= 0
80
+ {'loss': 0.00394418, 'grad_norm': 0.42660096, 'learning_rate': 2.68e-06, 'completions/mean_length': 49.16666756, 'completions/min_length': 35.4, 'completions/max_length': 62.85, 'completions/clipped_ratio': 0.0, 'reward': 0.02952445, 'reward_std': 0.14753249, 'frac_reward_zero_std': 0.0, 'rewards/ASRWerSubLenCmpHalluDirtyV56/mean': 0.02952445, 'rewards/ASRWerSubLenCmpHalluDirtyV56/std': 0.38754931, 'kl': 0.00462258, 'clip_ratio/low_mean': 0.01453043, 'clip_ratio/low_min': 0.00974138, 'clip_ratio/high_mean': 0.00804176, 'clip_ratio/high_max': 0.01153084, 'clip_ratio/region_mean': 0.0225722, 'step_time': 26.1855211, 'epoch': 0.0, 'global_step/max_steps': '15/9327', 'elapsed_time': '13m 52s', 'remaining_time': '5d 23h 33m 19s', 'memory(GiB)': 8.25, 'train_speed(s/it)': 55.498132}
81
+ [DEBUG generate] shape= (24, 244) last_col_pad_cnt= 0 first_col_pad_cnt= 12
82
+ [DEBUG generate] shape= (24, 244) last_col_pad_cnt= 0 first_col_pad_cnt= 12
83
+ [DEBUG generate] shape= (24, 253) last_col_pad_cnt= 0 first_col_pad_cnt= 12
84
+ [DEBUG generate] shape= (24, 253) last_col_pad_cnt= 0 first_col_pad_cnt= 12
85
+ [DEBUG generate] shape= (24, 244) last_col_pad_cnt= 0 first_col_pad_cnt= 12
86
+ [DEBUG generate] shape= (24, 244) last_col_pad_cnt= 0 first_col_pad_cnt= 12
87
+ [DEBUG generate] shape= (24, 277) last_col_pad_cnt= 0 first_col_pad_cnt= 12
88
+ [DEBUG generate] shape= (24, 277) last_col_pad_cnt= 0 first_col_pad_cnt= 12
89
+ [DEBUG generate] shape= (24, 236) last_col_pad_cnt= 0 first_col_pad_cnt= 12
90
+ [DEBUG generate] shape= (24, 236) last_col_pad_cnt= 0 first_col_pad_cnt= 12
91
+ [DEBUG generate] shape= (24, 252) last_col_pad_cnt= 0 first_col_pad_cnt= 12
92
+ [DEBUG generate] shape= (24, 252) last_col_pad_cnt= 0 first_col_pad_cnt= 12
93
+ [DEBUG generate] shape= (24, 157) last_col_pad_cnt= 0 first_col_pad_cnt= 12
94
+ [DEBUG generate] shape= (24, 157) last_col_pad_cnt= 0 first_col_pad_cnt= 12
95
+ [DEBUG generate] shape= (24, 252) last_col_pad_cnt= 0 first_col_pad_cnt= 12
96
+ [DEBUG generate] shape= (24, 252) last_col_pad_cnt= 0 first_col_pad_cnt= 12
97
+ [DEBUG generate] shape= (24, 239) last_col_pad_cnt= 0 first_col_pad_cnt= 12
98
+ [DEBUG generate] shape= (24, 239) last_col_pad_cnt= 0 first_col_pad_cnt= 12
99
+ [DEBUG generate] shape= (24, 251) last_col_pad_cnt= 0 first_col_pad_cnt= 12
100
+ [DEBUG generate] shape= (24, 251) last_col_pad_cnt= 0 first_col_pad_cnt= 12
101
+ {'loss': 0.00318602, 'grad_norm': 0.90874422, 'learning_rate': 3.57e-06, 'completions/mean_length': 48.42812653, 'completions/min_length': 30.25, 'completions/max_length': 61.4, 'completions/clipped_ratio': 0.0, 'reward': 0.02232184, 'reward_std': 0.16092061, 'frac_reward_zero_std': 0.0, 'rewards/ASRWerSubLenCmpHalluDirtyV56/mean': 0.02232184, 'rewards/ASRWerSubLenCmpHalluDirtyV56/std': 0.42085464, 'kl': 0.00529333, 'clip_ratio/low_mean': 0.01409527, 'clip_ratio/low_min': 0.00800156, 'clip_ratio/high_mean': 0.00843188, 'clip_ratio/high_max': 0.01220032, 'clip_ratio/region_mean': 0.02252715, 'step_time': 25.72940668, 'epoch': 0.01, 'global_step/max_steps': '20/9327', 'elapsed_time': '18m 13s', 'remaining_time': '5d 21h 15m 45s', 'memory(GiB)': 8.38, 'train_speed(s/it)': 54.641181}
102
+ [DEBUG generate] shape= (8, 245) last_col_pad_cnt= 0 first_col_pad_cnt= 4
103
+ Val: 4%|▍ | 2/53 [00:05<02:08, 2.53s/it][INFO:swift] last_model_checkpoint: None
104
+ [DEBUG generate] shape= (8, 238) last_col_pad_cnt= 0 first_col_pad_cnt= 4
105
+ [DEBUG generate] shape= (8, 249) last_col_pad_cnt= 0 first_col_pad_cnt= 4
106
+ [INFO:swift] best_model_checkpoint: None
107
+ Traceback (most recent call last):
108
+ File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/cli/rlhf.py", line 7, in <module>
109
+ rlhf_main()
110
+ File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/pipelines/train/rlhf.py", line 243, in rlhf_main
111
+ return SwiftRLHF(args).main()
112
+ File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/pipelines/base.py", line 52, in main
113
+ result = self.run()
114
+ File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/ray/base.py", line 168, in wrapper
115
+ return func(self, *args, **kwargs)
116
+ File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/pipelines/train/sft.py", line 197, in run
117
+ return self.train(trainer)
118
+ File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/pipelines/train/sft.py", line 270, in train
119
+ trainer.train(resume_checkpoint)
120
+ File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/trainers/mixin.py", line 895, in train
121
+ res = super().train(*args, **kwargs)
122
+ File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/trainer.py", line 2325, in train
123
+ return inner_training_loop(
124
+ File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/trainer.py", line 2756, in _inner_training_loop
125
+ self._maybe_log_save_evaluate(
126
+ File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/trainers/mixin.py", line 972, in _maybe_log_save_evaluate
127
+ super()._maybe_log_save_evaluate(tr_loss, *args, **kwargs)
128
+ File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/trainer.py", line 3221, in _maybe_log_save_evaluate
129
+ metrics = self._evaluate(trial, ignore_keys_for_eval)
130
+ File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/trainer.py", line 3170, in _evaluate
131
+ metrics = self.evaluate(ignore_keys=ignore_keys_for_eval)
132
+ File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/trainer.py", line 4489, in evaluate
133
+ output = eval_loop(
134
+ File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/rlhf_trainers/grpo_trainer.py", line 1872, in evaluation_loop
135
+ output = super().evaluation_loop(dataloader, *args, **kwargs)
136
+ File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/trainer.py", line 4685, in evaluation_loop
137
+ losses, logits, labels = self.prediction_step(model, inputs, prediction_loss_only, ignore_keys=ignore_keys)
138
+ File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/trl/trainer/grpo_trainer.py", line 2293, in prediction_step
139
+ inputs = self._prepare_inputs(inputs)
140
+ File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/rlhf_trainers/utils.py", line 607, in wrapper
141
+ return func(self, *args, **kwargs)
142
+ File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/rlhf_trainers/grpo_trainer.py", line 208, in _prepare_inputs
143
+ inputs = self._generate_and_score_completions(generation_batch)
144
+ File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/rlhf_trainers/utils.py", line 607, in wrapper
145
+ return func(self, *args, **kwargs)
146
+ File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/rlhf_trainers/grpo_trainer.py", line 236, in _generate_and_score_completions
147
+ inputs = self._generate_completions(inputs)
148
+ File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/rlhf_trainers/grpo_trainer.py", line 222, in _generate_completions
149
+ results = self._infer_single_or_multi_turn(inputs, self.request_config)
150
+ File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/rlhf_trainers/rollout_mixin.py", line 733, in _infer_single_or_multi_turn
151
+ rollout_outputs: List[RolloutOutput] = self._rollout(inputs, request_config, is_global_inputs)
152
+ File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/rlhf_trainers/rollout_mixin.py", line 697, in _rollout
153
+ rollout_outputs = self._colocate_rollout(inputs, request_config)
154
+ File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/rlhf_trainers/rollout_mixin.py", line 1056, in _colocate_rollout
155
+ outputs: List[RolloutOutput] = self._engine_infer(infer_requests=inputs, request_config=request_config)
156
+ File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/rlhf_trainers/rollout_mixin.py", line 1077, in _engine_infer
157
+ res = self.engine.infer(infer_requests, request_config, use_tqdm=use_tqdm)
158
+ File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/infer_engine/transformers_engine.py", line 577, in infer
159
+ res += self._infer(infer_requests_samples, request_config, adapter_request=adapter_request)
160
+ File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/torch/utils/_contextlib.py", line 116, in decorate_context
161
+ return func(*args, **kwargs)
162
+ File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/infer_engine/transformers_engine.py", line 546, in _infer
163
+ res = infer_func(**kwargs)
164
+ File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/infer_engine/transformers_engine.py", line 397, in _infer_full
165
+ output = dict(self.template.generate(self.model, **generate_kwargs))
166
+ File "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/my_qwen3_asr_dapo_register.py", line 670, in generate
167
+ return super().generate(model, *args, **kwargs)
168
+ File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/template/base.py", line 666, in generate
169
+ return model.generate(*args, **kwargs)
170
+ File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/peft/peft_model.py", line 2048, in generate
171
+ outputs = self.base_model.generate(*args, **kwargs)
172
+ File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/torch/utils/_contextlib.py", line 116, in decorate_context
173
+ return func(*args, **kwargs)
174
+ File "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/Qwen3-ASR/qwen_asr/core/transformers_backend/modeling_qwen3_asr.py", line 1353, in generate
175
+ thinker_result = self.thinker.generate(input_ids=input_ids, return_dict_in_generate=True, **thinker_kwargs)
176
+ File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/torch/utils/_contextlib.py", line 116, in decorate_context
177
+ return func(*args, **kwargs)
178
+ File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/generation/utils.py", line 2566, in generate
179
+ result = decoding_method(
180
+ File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/generation/utils.py", line 2789, in _sample
181
+ outputs = model_forward(**model_inputs, return_dict=True)
182
+ File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1739, in _wrapped_call_impl
183
+ return self._call_impl(*args, **kwargs)
184
+ File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1750, in _call_impl
185
+ return forward_call(*args, **kwargs)
186
+ File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/utils/generic.py", line 918, in wrapper
187
+ output = func(self, *args, **kwargs)
188
+ File "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/Qwen3-ASR/qwen_asr/core/transformers_backend/modeling_qwen3_asr.py", line 1230, in forward
189
+ outputs = self.model(
190
+ File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1739, in _wrapped_call_impl
191
+ return self._call_impl(*args, **kwargs)
192
+ File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1750, in _call_impl
193
+ return forward_call(*args, **kwargs)
194
+ File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/utils/generic.py", line 1072, in wrapper
195
+ outputs = func(self, *args, **kwargs)
196
+ File "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/Qwen3-ASR/qwen_asr/core/transformers_backend/modeling_qwen3_asr.py", line 1043, in forward
197
+ layer_outputs = decoder_layer(
198
+ File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/modeling_layers.py", line 94, in __call__
199
+ return super().__call__(*args, **kwargs)
200
+ File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1739, in _wrapped_call_impl
201
+ return self._call_impl(*args, **kwargs)
202
+ File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1750, in _call_impl
203
+ return forward_call(*args, **kwargs)
204
+ File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/utils/deprecation.py", line 172, in wrapped_func
205
+ return func(*args, **kwargs)
206
+ File "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/Qwen3-ASR/qwen_asr/core/transformers_backend/modeling_qwen3_asr.py", line 262, in forward
207
+ hidden_states, _ = self.self_attn(
208
+ File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1739, in _wrapped_call_impl
209
+ return self._call_impl(*args, **kwargs)
210
+ File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1750, in _call_impl
211
+ return forward_call(*args, **kwargs)
212
+ File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/utils/deprecation.py", line 172, in wrapped_func
213
+ return func(*args, **kwargs)
214
+ File "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/Qwen3-ASR/qwen_asr/core/transformers_backend/modeling_qwen3_asr.py", line 188, in forward
215
+ query_states = self.q_norm(self.q_proj(hidden_states).view(hidden_shape)).transpose(1, 2)
216
+ KeyboardInterrupt
217
+ [rank0]: Traceback (most recent call last):
218
+ [rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/cli/rlhf.py", line 7, in <module>
219
+ [rank0]: rlhf_main()
220
+ [rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/pipelines/train/rlhf.py", line 243, in rlhf_main
221
+ [rank0]: return SwiftRLHF(args).main()
222
+ [rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/pipelines/base.py", line 52, in main
223
+ [rank0]: result = self.run()
224
+ [rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/ray/base.py", line 168, in wrapper
225
+ [rank0]: return func(self, *args, **kwargs)
226
+ [rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/pipelines/train/sft.py", line 197, in run
227
+ [rank0]: return self.train(trainer)
228
+ [rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/pipelines/train/sft.py", line 270, in train
229
+ [rank0]: trainer.train(resume_checkpoint)
230
+ [rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/trainers/mixin.py", line 895, in train
231
+ [rank0]: res = super().train(*args, **kwargs)
232
+ [rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/trainer.py", line 2325, in train
233
+ [rank0]: return inner_training_loop(
234
+ [rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/trainer.py", line 2756, in _inner_training_loop
235
+ [rank0]: self._maybe_log_save_evaluate(
236
+ [rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/trainers/mixin.py", line 972, in _maybe_log_save_evaluate
237
+ [rank0]: super()._maybe_log_save_evaluate(tr_loss, *args, **kwargs)
238
+ [rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/trainer.py", line 3221, in _maybe_log_save_evaluate
239
+ [rank0]: metrics = self._evaluate(trial, ignore_keys_for_eval)
240
+ [rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/trainer.py", line 3170, in _evaluate
241
+ [rank0]: metrics = self.evaluate(ignore_keys=ignore_keys_for_eval)
242
+ [rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/trainer.py", line 4489, in evaluate
243
+ [rank0]: output = eval_loop(
244
+ [rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/rlhf_trainers/grpo_trainer.py", line 1872, in evaluation_loop
245
+ [rank0]: output = super().evaluation_loop(dataloader, *args, **kwargs)
246
+ [rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/trainer.py", line 4685, in evaluation_loop
247
+ [rank0]: losses, logits, labels = self.prediction_step(model, inputs, prediction_loss_only, ignore_keys=ignore_keys)
248
+ [rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/trl/trainer/grpo_trainer.py", line 2293, in prediction_step
249
+ [rank0]: inputs = self._prepare_inputs(inputs)
250
+ [rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/rlhf_trainers/utils.py", line 607, in wrapper
251
+ [rank0]: return func(self, *args, **kwargs)
252
+ [rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/rlhf_trainers/grpo_trainer.py", line 208, in _prepare_inputs
253
+ [rank0]: inputs = self._generate_and_score_completions(generation_batch)
254
+ [rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/rlhf_trainers/utils.py", line 607, in wrapper
255
+ [rank0]: return func(self, *args, **kwargs)
256
+ [rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/rlhf_trainers/grpo_trainer.py", line 236, in _generate_and_score_completions
257
+ [rank0]: inputs = self._generate_completions(inputs)
258
+ [rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/rlhf_trainers/grpo_trainer.py", line 222, in _generate_completions
259
+ [rank0]: results = self._infer_single_or_multi_turn(inputs, self.request_config)
260
+ [rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/rlhf_trainers/rollout_mixin.py", line 733, in _infer_single_or_multi_turn
261
+ [rank0]: rollout_outputs: List[RolloutOutput] = self._rollout(inputs, request_config, is_global_inputs)
262
+ [rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/rlhf_trainers/rollout_mixin.py", line 697, in _rollout
263
+ [rank0]: rollout_outputs = self._colocate_rollout(inputs, request_config)
264
+ [rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/rlhf_trainers/rollout_mixin.py", line 1056, in _colocate_rollout
265
+ [rank0]: outputs: List[RolloutOutput] = self._engine_infer(infer_requests=inputs, request_config=request_config)
266
+ [rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/rlhf_trainers/rollout_mixin.py", line 1077, in _engine_infer
267
+ [rank0]: res = self.engine.infer(infer_requests, request_config, use_tqdm=use_tqdm)
268
+ [rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/infer_engine/transformers_engine.py", line 577, in infer
269
+ [rank0]: res += self._infer(infer_requests_samples, request_config, adapter_request=adapter_request)
270
+ [rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/torch/utils/_contextlib.py", line 116, in decorate_context
271
+ [rank0]: return func(*args, **kwargs)
272
+ [rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/infer_engine/transformers_engine.py", line 546, in _infer
273
+ [rank0]: res = infer_func(**kwargs)
274
+ [rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/infer_engine/transformers_engine.py", line 397, in _infer_full
275
+ [rank0]: output = dict(self.template.generate(self.model, **generate_kwargs))
276
+ [rank0]: File "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/my_qwen3_asr_dapo_register.py", line 670, in generate
277
+ [rank0]: return super().generate(model, *args, **kwargs)
278
+ [rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/template/base.py", line 666, in generate
279
+ [rank0]: return model.generate(*args, **kwargs)
280
+ [rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/peft/peft_model.py", line 2048, in generate
281
+ [rank0]: outputs = self.base_model.generate(*args, **kwargs)
282
+ [rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/torch/utils/_contextlib.py", line 116, in decorate_context
283
+ [rank0]: return func(*args, **kwargs)
284
+ [rank0]: File "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/Qwen3-ASR/qwen_asr/core/transformers_backend/modeling_qwen3_asr.py", line 1353, in generate
285
+ [rank0]: thinker_result = self.thinker.generate(input_ids=input_ids, return_dict_in_generate=True, **thinker_kwargs)
286
+ [rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/torch/utils/_contextlib.py", line 116, in decorate_context
287
+ [rank0]: return func(*args, **kwargs)
288
+ [rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/generation/utils.py", line 2566, in generate
289
+ [rank0]: result = decoding_method(
290
+ [rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/generation/utils.py", line 2789, in _sample
291
+ [rank0]: outputs = model_forward(**model_inputs, return_dict=True)
292
+ [rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1739, in _wrapped_call_impl
293
+ [rank0]: return self._call_impl(*args, **kwargs)
294
+ [rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1750, in _call_impl
295
+ [rank0]: return forward_call(*args, **kwargs)
296
+ [rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/utils/generic.py", line 918, in wrapper
297
+ [rank0]: output = func(self, *args, **kwargs)
298
+ [rank0]: File "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/Qwen3-ASR/qwen_asr/core/transformers_backend/modeling_qwen3_asr.py", line 1230, in forward
299
+ [rank0]: outputs = self.model(
300
+ [rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1739, in _wrapped_call_impl
301
+ [rank0]: return self._call_impl(*args, **kwargs)
302
+ [rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1750, in _call_impl
303
+ [rank0]: return forward_call(*args, **kwargs)
304
+ [rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/utils/generic.py", line 1072, in wrapper
305
+ [rank0]: outputs = func(self, *args, **kwargs)
306
+ [rank0]: File "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/Qwen3-ASR/qwen_asr/core/transformers_backend/modeling_qwen3_asr.py", line 1043, in forward
307
+ [rank0]: layer_outputs = decoder_layer(
308
+ [rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/modeling_layers.py", line 94, in __call__
309
+ [rank0]: return super().__call__(*args, **kwargs)
310
+ [rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1739, in _wrapped_call_impl
311
+ [rank0]: return self._call_impl(*args, **kwargs)
312
+ [rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1750, in _call_impl
313
+ [rank0]: return forward_call(*args, **kwargs)
314
+ [rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/utils/deprecation.py", line 172, in wrapped_func
315
+ [rank0]: return func(*args, **kwargs)
316
+ [rank0]: File "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/Qwen3-ASR/qwen_asr/core/transformers_backend/modeling_qwen3_asr.py", line 262, in forward
317
+ [rank0]: hidden_states, _ = self.self_attn(
318
+ [rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1739, in _wrapped_call_impl
319
+ [rank0]: return self._call_impl(*args, **kwargs)
320
+ [rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/torch/nn/modules/module.py", line 1750, in _call_impl
321
+ [rank0]: return forward_call(*args, **kwargs)
322
+ [rank0]: File "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/transformers/utils/deprecation.py", line 172, in wrapped_func
323
+ [rank0]: return func(*args, **kwargs)
324
+ [rank0]: File "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/Qwen3-ASR/qwen_asr/core/transformers_backend/modeling_qwen3_asr.py", line 188, in forward
325
+ [rank0]: query_states = self.q_norm(self.q_proj(hidden_states).view(hidden_shape)).transpose(1, 2)
326
+ [rank0]: KeyboardInterrupt
wandb/run-20260417_123237-3h84yfea/files/requirements.txt ADDED
@@ -0,0 +1,255 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ psutil==7.2.2
2
+ colorama==0.4.6
3
+ typing-inspection==0.4.2
4
+ dill==0.3.8
5
+ aliyun-python-sdk-kms==2.16.5
6
+ urllib3==2.6.3
7
+ torch==2.6.0
8
+ threadpoolctl==3.6.0
9
+ pyzmq==27.1.0
10
+ astor==0.8.1
11
+ hf-xet==1.4.3
12
+ sniffio==1.3.1
13
+ tensorboard==2.20.0
14
+ fastar==0.11.0
15
+ llvmlite==0.43.0
16
+ pathspec==1.0.4
17
+ mkl_fft==1.3.11
18
+ prometheus_client==0.25.0
19
+ async-timeout==5.0.1
20
+ scikit-learn==1.7.2
21
+ sortedcontainers==2.4.0
22
+ Bottleneck==1.4.2
23
+ orjson==3.11.8
24
+ nest-asyncio==1.6.0
25
+ cupy-cuda12x==13.6.0
26
+ semantic-version==2.10.0
27
+ aiosignal==1.4.0
28
+ fsspec==2025.3.0
29
+ dyNET38==2.2
30
+ shellingham==1.5.4
31
+ zstandard==0.25.0
32
+ PyYAML==6.0.3
33
+ nvidia-curand-cu12==10.3.5.147
34
+ gradio==5.50.0
35
+ Werkzeug==3.1.8
36
+ grpcio==1.80.0
37
+ aiohttp==3.13.5
38
+ Flask==3.1.3
39
+ python-json-logger==4.1.0
40
+ trl==0.29.1
41
+ nltk==3.9.4
42
+ platformdirs==4.9.6
43
+ lm-format-enforcer==0.10.12
44
+ pyparsing==3.3.2
45
+ jmespath==0.10.0
46
+ starlette==0.52.1
47
+ crcmod==1.7
48
+ dnspython==2.8.0
49
+ antlr4-python3-runtime==4.9.3
50
+ rouge==1.0.1
51
+ importlib_metadata==9.0.0
52
+ nvidia-cudnn-cu12==9.1.0.70
53
+ safetensors==0.7.0
54
+ blake3==1.0.8
55
+ interegular==0.3.3
56
+ tiktoken==0.11.0
57
+ pydantic_core==2.41.4
58
+ outlines==0.1.11
59
+ airportsdata==20260315
60
+ rich-toolkit==0.19.7
61
+ multiprocess==0.70.16
62
+ sympy==1.13.1
63
+ psutil==7.2.2
64
+ h11==0.16.0
65
+ anyio==4.13.0
66
+ Cython==3.2.4
67
+ outlines_core==0.1.26
68
+ jsonschema==4.26.0
69
+ nvidia-cuda-cupti-cu12==12.4.127
70
+ meson-python==0.19.0
71
+ depyf==0.18.0
72
+ audioread==3.1.0
73
+ typer==0.24.1
74
+ nvidia-cuda-nvrtc-cu12==12.4.127
75
+ joblib==1.5.3
76
+ torchvision==0.21.0
77
+ hf-gradio==0.3.2
78
+ huggingface_hub==0.36.2
79
+ websockets==15.0.1
80
+ diskcache==5.6.3
81
+ mistral_common==1.11.0
82
+ partial-json-parser==0.2.1.1.post7
83
+ simplejson==3.20.2
84
+ watchfiles==1.1.1
85
+ Jinja2==3.1.6
86
+ GitPython==3.1.46
87
+ numexpr==2.11.0
88
+ pydub==0.25.1
89
+ brotli==1.2.0
90
+ binpacking==2.0.1
91
+ cmake==4.3.1
92
+ pydantic==2.12.3
93
+ mkl-service==2.4.0
94
+ protobuf==6.33.6
95
+ gguf==0.10.0
96
+ MarkupSafe==3.0.3
97
+ exceptiongroup==1.3.1
98
+ markdown-it-py==4.0.0
99
+ soxr==1.0.0
100
+ pyarrow==20.0.0
101
+ tqdm==4.67.3
102
+ meson==1.11.0
103
+ fonttools==4.62.1
104
+ annotated-types==0.7.0
105
+ networkx==3.4.2
106
+ nvidia-cuda-runtime-cu12==12.4.127
107
+ compressed-tensors==0.9.2
108
+ wandb==0.23.0
109
+ mdurl==0.1.2
110
+ charset-normalizer==3.4.7
111
+ Pygments==2.20.0
112
+ zipp==3.23.1
113
+ prometheus-fastapi-instrumentator==7.1.0
114
+ aiofiles==24.1.0
115
+ lark==1.2.2
116
+ addict==2.4.0
117
+ pydantic-settings==2.13.1
118
+ opencv-python-headless==4.11.0.86
119
+ certifi==2026.2.25
120
+ sox==1.5.0
121
+ nagisa==0.2.11
122
+ six==1.17.0
123
+ tokenizers==0.22.2
124
+ mkl_random==1.2.8
125
+ fastapi-cloud-cli==0.17.0
126
+ propcache==0.4.1
127
+ cachetools==7.0.5
128
+ rpds-py==0.30.0
129
+ torchaudio==2.6.0
130
+ setuptools==82.0.1
131
+ py-cpuinfo==9.0.0
132
+ tomli==2.4.1
133
+ xxhash==3.6.0
134
+ pip==26.0.1
135
+ contourpy==1.3.2
136
+ absl-py==2.4.0
137
+ mpmath==1.3.0
138
+ ms_swift==4.0.3
139
+ pyproject-metadata==0.11.0
140
+ aiohappyeyeballs==2.6.1
141
+ httpx==0.28.1
142
+ json_repair==0.59.4
143
+ blinker==1.9.0
144
+ tzdata==2025.3
145
+ tensorboard-data-server==0.7.2
146
+ pydantic-extra-types==2.11.1
147
+ Markdown==3.10.2
148
+ nvidia-cusparselt-cu12==0.6.2
149
+ rignore==0.7.6
150
+ openai==2.32.0
151
+ soundfile==0.13.1
152
+ lazy-loader==0.5
153
+ av==14.2.0
154
+ yarl==1.23.0
155
+ python-dateutil==2.9.0.post0
156
+ groovy==0.1.2
157
+ xformers==0.0.29.post2
158
+ qwen-omni-utils==0.0.9
159
+ rich==15.0.0
160
+ xgrammar==0.1.16
161
+ numba==0.60.0
162
+ nvidia-cusolver-cu12==11.6.1.9
163
+ scikit_build_core==0.12.2
164
+ ffmpy==1.0.0
165
+ wheel==0.46.3
166
+ jiter==0.14.0
167
+ oss2==2.19.1
168
+ transformers==4.57.6
169
+ fastrlock==0.8.3
170
+ click==8.3.2
171
+ pooch==1.9.0
172
+ distro==1.9.0
173
+ nvidia-cublas-cu12==12.4.5.8
174
+ regex==2026.4.4
175
+ cpm-kernels==1.0.11
176
+ safehttpx==0.1.7
177
+ matplotlib==3.10.8
178
+ httptools==0.7.1
179
+ nvidia-cusparse-cu12==12.3.1.170
180
+ qwen-asr==0.0.6
181
+ gradio_client==1.14.0
182
+ gitdb==4.0.12
183
+ fastapi-cli==0.0.24
184
+ soynlp==0.0.493
185
+ python-dotenv==1.2.2
186
+ nvidia-cufft-cu12==11.2.1.3
187
+ accelerate==1.12.0
188
+ tomlkit==0.13.3
189
+ triton==3.2.0
190
+ filelock==3.28.0
191
+ pycountry==26.2.16
192
+ modelscope==1.35.4
193
+ annotated-doc==0.0.4
194
+ referencing==0.37.0
195
+ numpy==1.26.4
196
+ aliyun-python-sdk-core==2.16.0
197
+ attrs==26.1.0
198
+ vllm==0.8.0
199
+ python-multipart==0.0.26
200
+ jsonschema-specifications==2025.9.1
201
+ idna==3.11
202
+ scipy==1.15.3
203
+ typing_extensions==4.15.0
204
+ itsdangerous==2.2.0
205
+ msgspec==0.21.1
206
+ msgpack==1.1.2
207
+ nvidia-nvjitlink-cu12==12.4.127
208
+ pycryptodome==3.23.0
209
+ ninja==1.13.0
210
+ pillow==11.3.0
211
+ email-validator==2.3.0
212
+ cryptography==46.0.7
213
+ peft==0.18.1
214
+ kiwisolver==1.5.0
215
+ cffi==2.0.0
216
+ einops==0.8.2
217
+ pytz==2026.1.post1
218
+ uvloop==0.22.1
219
+ requests==2.33.1
220
+ sentencepiece==0.2.1
221
+ attrdict==2.0.1
222
+ dacite==1.9.2
223
+ cloudpickle==3.1.2
224
+ ray==2.55.0
225
+ fastapi==0.135.3
226
+ librosa==0.11.0
227
+ ruff==0.15.10
228
+ multidict==6.7.1
229
+ smmap==5.0.3
230
+ packaging==26.0
231
+ pycparser==3.0
232
+ decorator==5.2.1
233
+ transformers-stream-generator==0.0.5
234
+ nvidia-nccl-cu12==2.21.5
235
+ frozenlist==1.8.0
236
+ uvicorn==0.44.0
237
+ datasets==3.6.0
238
+ cycler==0.12.1
239
+ omegaconf==2.3.0
240
+ httpcore==1.0.9
241
+ pandas==2.3.2
242
+ nvidia-nvtx-cu12==12.4.127
243
+ sentry-sdk==2.58.0
244
+ wheel==0.46.3
245
+ autocommand==2.2.2
246
+ tomli==2.4.0
247
+ packaging==26.0
248
+ more-itertools==10.8.0
249
+ zipp==3.23.0
250
+ platformdirs==4.4.0
251
+ jaraco.context==6.1.0
252
+ jaraco.text==4.0.0
253
+ backports.tarfile==1.2.0
254
+ jaraco.functools==4.4.0
255
+ importlib_metadata==8.7.1
wandb/run-20260417_123237-3h84yfea/files/wandb-metadata.json ADDED
@@ -0,0 +1,223 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "os": "Linux-3.10.0-957.el7.x86_64-x86_64-with-glibc2.17",
3
+ "python": "CPython 3.10.18",
4
+ "startedAt": "2026-04-17T04:32:37.414555Z",
5
+ "args": [
6
+ "--rlhf_type",
7
+ "grpo",
8
+ "--external_plugins",
9
+ "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/my_qwen3_asr_dapo_register.py",
10
+ "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/0417_reward.py",
11
+ "--model",
12
+ "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/qwen3-asr-merged",
13
+ "--model_type",
14
+ "my_qwen3_asr_rl",
15
+ "--template",
16
+ "my_qwen3_asr_rl",
17
+ "--dataset",
18
+ "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/lora_0323_10w+55w+error+syn_with_domain_train90_targeted_rl_train90_loramerged_basewer_3suppress_server.jsonl",
19
+ "--val_dataset",
20
+ "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/lora_0323_10w+55w+error+syn_with_domain_train90_targeted_rl_val5_sample5p_server.jsonl",
21
+ "--reward_funcs",
22
+ "asr_wer_sub_len_cmp_hallu_dirty_v56",
23
+ "--train_type",
24
+ "lora",
25
+ "--use_vllm",
26
+ "false",
27
+ "--log_completions",
28
+ "true",
29
+ "--loss_type",
30
+ "dapo",
31
+ "--advantage_estimator",
32
+ "grpo",
33
+ "--scale_rewards",
34
+ "group",
35
+ "--num_iterations",
36
+ "2",
37
+ "--beta",
38
+ "0.04",
39
+ "--epsilon_high",
40
+ "0.28",
41
+ "--dynamic_sample",
42
+ "true",
43
+ "--max_resample_times",
44
+ "4",
45
+ "--overlong_filter",
46
+ "true",
47
+ "--truncation_strategy",
48
+ "delete",
49
+ "--num_generations",
50
+ "12",
51
+ "--generation_batch_size",
52
+ "48",
53
+ "--per_device_train_batch_size",
54
+ "8",
55
+ "--per_device_eval_batch_size",
56
+ "8",
57
+ "--gradient_accumulation_steps",
58
+ "12",
59
+ "--num_generations_eval",
60
+ "4",
61
+ "--max_completion_length",
62
+ "256",
63
+ "--temperature",
64
+ "0.50",
65
+ "--top_p",
66
+ "0.95",
67
+ "--top_k",
68
+ "50",
69
+ "--repetition_penalty",
70
+ "1.08",
71
+ "--learning_rate",
72
+ "5e-5",
73
+ "--lr_scheduler_type",
74
+ "cosine",
75
+ "--warmup_ratio",
76
+ "0.03",
77
+ "--report_to",
78
+ "wandb",
79
+ "--run_name",
80
+ "qwen3asr_dapo_reward56_4x4x12_12gen_4GPU",
81
+ "--output_dir",
82
+ "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/out/qwen3asr_dapo_reward56_4x4x12_12gen_4GPU",
83
+ "--save_strategy",
84
+ "steps",
85
+ "--save_steps",
86
+ "20",
87
+ "--logging_steps",
88
+ "5",
89
+ "--freeze_llm",
90
+ "false",
91
+ "--freeze_vit",
92
+ "false",
93
+ "--freeze_aligner",
94
+ "false",
95
+ "--remove_unused_columns",
96
+ "false",
97
+ "--padding_side",
98
+ "left"
99
+ ],
100
+ "program": "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/cli/rlhf.py",
101
+ "email": "pang_kaiyu@163.com",
102
+ "root": "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload",
103
+ "host": "SH-IDC1-10-140-37-1",
104
+ "executable": "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/bin/python3.10",
105
+ "cpu_count": 64,
106
+ "cpu_count_logical": 128,
107
+ "gpu": "NVIDIA A100-SXM4-80GB",
108
+ "gpu_count": 8,
109
+ "disk": {
110
+ "/": {
111
+ "total": "524945911808",
112
+ "used": "105544630272"
113
+ }
114
+ },
115
+ "memory": {
116
+ "total": "1081627828224"
117
+ },
118
+ "gpu_nvidia": [
119
+ {
120
+ "name": "NVIDIA A100-SXM4-80GB",
121
+ "memoryTotal": "85899345920",
122
+ "cudaCores": 6912,
123
+ "architecture": "Ampere",
124
+ "uuid": "GPU-51466de9-a668-3c7e-bb90-bb8c112e0fea"
125
+ },
126
+ {
127
+ "name": "NVIDIA A100-SXM4-80GB",
128
+ "memoryTotal": "85899345920",
129
+ "cudaCores": 6912,
130
+ "architecture": "Ampere",
131
+ "uuid": "GPU-ec1a5f87-66dd-26c2-5656-b57c7015a595"
132
+ },
133
+ {
134
+ "name": "NVIDIA A100-SXM4-80GB",
135
+ "memoryTotal": "85899345920",
136
+ "cudaCores": 6912,
137
+ "architecture": "Ampere",
138
+ "uuid": "GPU-2dabb104-8ec6-09ec-017a-204779e18c19"
139
+ },
140
+ {
141
+ "name": "NVIDIA A100-SXM4-80GB",
142
+ "memoryTotal": "85899345920",
143
+ "cudaCores": 6912,
144
+ "architecture": "Ampere",
145
+ "uuid": "GPU-0e67540a-1930-f39b-320f-0a6bfe1da2e0"
146
+ },
147
+ {
148
+ "name": "NVIDIA A100-SXM4-80GB",
149
+ "memoryTotal": "85899345920",
150
+ "cudaCores": 6912,
151
+ "architecture": "Ampere",
152
+ "uuid": "GPU-b46e583c-5ac8-e350-6045-49ad7b17c092"
153
+ },
154
+ {
155
+ "name": "NVIDIA A100-SXM4-80GB",
156
+ "memoryTotal": "85899345920",
157
+ "cudaCores": 6912,
158
+ "architecture": "Ampere",
159
+ "uuid": "GPU-f293d16a-41a0-fbc1-e86c-4f9682cb5e2b"
160
+ },
161
+ {
162
+ "name": "NVIDIA A100-SXM4-80GB",
163
+ "memoryTotal": "85899345920",
164
+ "cudaCores": 6912,
165
+ "architecture": "Ampere",
166
+ "uuid": "GPU-67958330-9199-dca8-5c2e-c665b13b3452"
167
+ },
168
+ {
169
+ "name": "NVIDIA A100-SXM4-80GB",
170
+ "memoryTotal": "85899345920",
171
+ "cudaCores": 6912,
172
+ "architecture": "Ampere",
173
+ "uuid": "GPU-6b56602f-4dcf-cb9d-4e98-04bf6254b789"
174
+ }
175
+ ],
176
+ "cudaVersion": "12.4",
177
+ "slurm": {
178
+ "cluster_name": "cluster_sproject3",
179
+ "conf": "/etc/slurm/slurm.conf",
180
+ "cpus_on_node": "2",
181
+ "gtids": "0",
182
+ "job_account": "research",
183
+ "job_cpus_per_node": "2",
184
+ "job_gid": "800000689",
185
+ "job_id": "8568802",
186
+ "job_name": "qwen_debug",
187
+ "job_nodelist": "SH-IDC1-10-140-37-1",
188
+ "job_num_nodes": "1",
189
+ "job_partition": "interntmp",
190
+ "job_qos": "normal",
191
+ "job_uid": "800000689",
192
+ "job_user": "panjiabao",
193
+ "jobid": "8568802",
194
+ "launch_node_ipaddr": "10.140.37.164",
195
+ "localid": "0",
196
+ "nnodes": "1",
197
+ "nodeid": "0",
198
+ "nodelist": "SH-IDC1-10-140-37-1",
199
+ "nprocs": "1",
200
+ "ntasks": "1",
201
+ "prio_process": "0",
202
+ "procid": "0",
203
+ "srun_comm_host": "10.140.37.164",
204
+ "srun_comm_port": "44570",
205
+ "step_gpus": "4,5",
206
+ "step_id": "0",
207
+ "step_launcher_port": "44570",
208
+ "step_nodelist": "SH-IDC1-10-140-37-1",
209
+ "step_num_nodes": "1",
210
+ "step_num_tasks": "1",
211
+ "step_tasks_per_node": "1",
212
+ "stepid": "0",
213
+ "submit_dir": "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload",
214
+ "submit_host": "SH-IDC1-10-140-37-164",
215
+ "task_pid": "24357",
216
+ "tasks_per_node": "1",
217
+ "topology_addr": "SH-IDC1-10-140-37-1",
218
+ "topology_addr_pattern": "node",
219
+ "umask": "0002",
220
+ "working_cluster": "cluster_sproject3:SH-IDC1-10-140-37-161:6817:9216:109"
221
+ },
222
+ "writerId": "bpic2cpmtxvnwca2pu2tg19g1j2qwpb2"
223
+ }
wandb/run-20260417_123237-3h84yfea/files/wandb-summary.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"_step":10,"train/clip_ratio/high_max":0.012200319871772081,"_runtime":1109.549686456,"train/rewards/ASRWerSubLenCmpHalluDirtyV56/std":0.4208546429872513,"profiling/Time taken: GRPOTrainer.ASRWerSubLenCmpHalluDirtyV56":0.05729236314073205,"train/learning_rate":3.5714285714285714e-06,"profiling/Time taken: GRPOTrainer._prepare_batch_inputs":0.7034707930870354,"train/reward":0.022321835905313493,"profiling/Time taken: GRPOTrainer.generate":3.802002454176545,"train/epoch":0.0064329366355741395,"train/frac_reward_zero_std":0,"train/clip_ratio/low_mean":0.014095272546789299,"train/clip_ratio/region_mean":0.02252715122886002,"train/completions/max_length":61.4,"train/completions/mean_length":48.42812652587891,"train/completions/min_length":30.25,"train/clip_ratio/low_min":0.008001556829549372,"train/kl":0.00529333179583773,"completions":{"path":"media/table/completions_9_ec21142175e3781c9ddd.table.json","ncols":6,"log_mode":"IMMUTABLE","_type":"table-file","artifact_path":"wandb-client-artifact://kz4vrnypdmle4zgoj3c84weqxmxkvdxftnrs55geadw9knsskgfo49q6n1xtl9bk3gu4h9ojvabrseb66dnps3myxgfrem7lvv7fjv618wfxr5ofpjviqu6xhn9nlkki/completions.table.json","size":30810,"nrows":48,"_latest_artifact_path":"wandb-client-artifact://b69jh609tckqry5pvjdgc75co4t33phnplrzajmhbdyubzbumzvvphifhlwul9nw1lkqc2xwcxwq9l1gnv9ymu6hjz8nv21mkh590wyd7n2m3v6vfjc58y4w8x9kkji0:latest/completions.table.json","sha256":"ec21142175e3781c9ddd0e8bcbb9129cea8a4112a1677ab3a9541e1a4670ca03"},"profiling/Time taken: GRPOTrainer.compute_loss":0.38397085713222623,"train/clip_ratio/high_mean":0.008431878668488935,"train/global_step":20,"train/step_time":25.729406683100386,"profiling/Time taken: GRPOTrainer._score_completions":0.05837428104132414,"profiling/Time taken: GRPOTrainer.log_metrics":0.00924607808701694,"train/loss":0.0031860221177339556,"_wandb":{"runtime":1109},"profiling/Time taken: GRPOTrainer._get_per_token_logps_and_entropies":0.34411595296114683,"profiling/Time taken: 
GRPOTrainer._generate_and_score_completions":4.66908916993998,"_timestamp":1.7764014649839177e+09,"profiling/Time taken: GRPOTrainer._prepare_inputs":4.669255583081394,"train/reward_std":0.1609206058084965,"train/completions/clipped_ratio":0,"profiling/Time taken: GRPOTrainer.resample_encode_failed_inputs":0.07994826301001012,"profiling/Time taken: GRPOTrainer._dynamic_sampling":1.0511806420981884,"train/rewards/ASRWerSubLenCmpHalluDirtyV56/mean":0.02232184025924653,"train/grad_norm":0.908744215965271}
wandb/run-20260417_123237-3h84yfea/logs/debug-core.log ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"time":"2026-04-17T12:32:37.733571714+08:00","level":"INFO","msg":"main: starting server","port-filename":"/tmp/tmp6lseefed/port-26590.txt","pid":26590,"log-level":0,"disable-analytics":false,"shutdown-on-parent-exit":false,"enable-dcgm-profiling":false}
2
+ {"time":"2026-04-17T12:32:37.736196619+08:00","level":"INFO","msg":"server: will exit if parent process dies","ppid":26590}
3
+ {"time":"2026-04-17T12:32:37.736232389+08:00","level":"INFO","msg":"server: accepting connections","addr":{"Name":"/tmp/wandb-26590-39544-1290766967/socket","Net":"unix"}}
4
+ {"time":"2026-04-17T12:32:37.819031966+08:00","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"1(@)"}
5
+ {"time":"2026-04-17T12:32:37.828108271+08:00","level":"INFO","msg":"handleInformInit: received","streamId":"3h84yfea","id":"1(@)"}
6
+ {"time":"2026-04-17T12:32:38.291204091+08:00","level":"INFO","msg":"handleInformInit: stream started","streamId":"3h84yfea","id":"1(@)"}
7
+ {"time":"2026-04-17T12:51:08.851141958+08:00","level":"INFO","msg":"handleInformTeardown: server teardown initiated","id":"1(@)"}
8
+ {"time":"2026-04-17T12:51:08.851692926+08:00","level":"INFO","msg":"server is shutting down"}
9
+ {"time":"2026-04-17T12:51:08.851679858+08:00","level":"INFO","msg":"connection: closing","id":"1(@)"}
10
+ {"time":"2026-04-17T12:51:08.852412712+08:00","level":"INFO","msg":"server: listener closed","addr":{"Name":"/tmp/wandb-26590-39544-1290766967/socket","Net":"unix"}}
11
+ {"time":"2026-04-17T12:51:08.852821471+08:00","level":"INFO","msg":"connection: closed successfully","id":"1(@)"}
12
+ {"time":"2026-04-17T12:51:45.045595577+08:00","level":"INFO","msg":"handleInformTeardown: server shutdown complete","id":"1(@)"}
13
+ {"time":"2026-04-17T12:51:45.046301783+08:00","level":"INFO","msg":"connection: ManageConnectionData: connection closed","id":"1(@)"}
14
+ {"time":"2026-04-17T12:51:45.046872221+08:00","level":"INFO","msg":"server is closed"}
wandb/run-20260417_123237-3h84yfea/logs/debug-internal.log ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"time":"2026-04-17T12:32:37.831597637+08:00","level":"INFO","msg":"stream: starting","core version":"0.23.0"}
2
+ {"time":"2026-04-17T12:32:38.28711188+08:00","level":"INFO","msg":"stream: created new stream","id":"3h84yfea"}
3
+ {"time":"2026-04-17T12:32:38.287178211+08:00","level":"INFO","msg":"handler: started","stream_id":"3h84yfea"}
4
+ {"time":"2026-04-17T12:32:38.291195021+08:00","level":"INFO","msg":"stream: started","id":"3h84yfea"}
5
+ {"time":"2026-04-17T12:32:38.291204401+08:00","level":"INFO","msg":"sender: started","stream_id":"3h84yfea"}
6
+ {"time":"2026-04-17T12:32:38.291218278+08:00","level":"INFO","msg":"writer: started","stream_id":"3h84yfea"}
7
+ {"time":"2026-04-17T12:47:19.109479888+08:00","level":"INFO","msg":"api: retrying HTTP error","status":500,"url":"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/3h84yfea/file_stream","body":"{\"error\":\"context deadline exceeded\"}"}
8
+ {"time":"2026-04-17T12:51:08.790892907+08:00","level":"INFO","msg":"flowcontrol: backed up, offloading to disk","recordNumber":1780}
9
+ {"time":"2026-04-17T12:51:08.792427055+08:00","level":"INFO","msg":"flowcontrol: unblocked","totalOffloaded":34}
10
+ {"time":"2026-04-17T12:51:08.85169372+08:00","level":"INFO","msg":"stream: closing","id":"3h84yfea"}
11
+ {"time":"2026-04-17T12:51:10.104739264+08:00","level":"INFO","msg":"fileTransfer: Close: file transfer manager closed"}
12
+ {"time":"2026-04-17T12:51:45.039416039+08:00","level":"INFO","msg":"handler: closed","stream_id":"3h84yfea"}
13
+ {"time":"2026-04-17T12:51:45.041478496+08:00","level":"INFO","msg":"sender: closed","stream_id":"3h84yfea"}
14
+ {"time":"2026-04-17T12:51:45.041508452+08:00","level":"INFO","msg":"stream: closed","id":"3h84yfea"}
wandb/run-20260417_123237-3h84yfea/logs/debug.log ADDED
@@ -0,0 +1,26 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2026-04-17 12:32:37,468 INFO MainThread:26590 [wandb_setup.py:_flush():80] Current SDK version is 0.23.0
2
+ 2026-04-17 12:32:37,468 INFO MainThread:26590 [wandb_setup.py:_flush():80] Configure stats pid to 26590
3
+ 2026-04-17 12:32:37,468 INFO MainThread:26590 [wandb_setup.py:_flush():80] Loading settings from /mnt/petrelfs/panjiabao/.config/wandb/settings
4
+ 2026-04-17 12:32:37,468 INFO MainThread:26590 [wandb_setup.py:_flush():80] Loading settings from /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/wandb/settings
5
+ 2026-04-17 12:32:37,468 INFO MainThread:26590 [wandb_setup.py:_flush():80] Loading settings from environment variables
6
+ 2026-04-17 12:32:37,468 INFO MainThread:26590 [wandb_init.py:setup_run_log_directory():713] Logging user logs to /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/wandb/run-20260417_123237-3h84yfea/logs/debug.log
7
+ 2026-04-17 12:32:37,468 INFO MainThread:26590 [wandb_init.py:setup_run_log_directory():714] Logging internal logs to /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/wandb/run-20260417_123237-3h84yfea/logs/debug-internal.log
8
+ 2026-04-17 12:32:37,468 INFO MainThread:26590 [wandb_init.py:init():840] calling init triggers
9
+ 2026-04-17 12:32:37,468 INFO MainThread:26590 [wandb_init.py:init():845] wandb.init called with sweep_config: {}
10
+ config: {'_wandb': {}}
11
+ 2026-04-17 12:32:37,468 INFO MainThread:26590 [wandb_init.py:init():888] starting backend
12
+ 2026-04-17 12:32:37,819 INFO MainThread:26590 [wandb_init.py:init():891] sending inform_init request
13
+ 2026-04-17 12:32:37,823 INFO MainThread:26590 [wandb_init.py:init():899] backend started and connected
14
+ 2026-04-17 12:32:37,825 INFO MainThread:26590 [wandb_init.py:init():969] updated telemetry
15
+ 2026-04-17 12:32:37,826 INFO MainThread:26590 [wandb_init.py:init():993] communicating run to backend with 90.0 second timeout
16
+ 2026-04-17 12:32:39,301 INFO MainThread:26590 [wandb_init.py:init():1040] starting run threads in backend
17
+ 2026-04-17 12:32:39,937 INFO MainThread:26590 [wandb_run.py:_console_start():2504] atexit reg
18
+ 2026-04-17 12:32:39,937 INFO MainThread:26590 [wandb_run.py:_redirect():2352] redirect: wrap_raw
19
+ 2026-04-17 12:32:39,937 INFO MainThread:26590 [wandb_run.py:_redirect():2421] Wrapping output streams.
20
+ 2026-04-17 12:32:39,937 INFO MainThread:26590 [wandb_run.py:_redirect():2444] Redirects installed.
21
+ 2026-04-17 12:32:39,944 INFO MainThread:26590 [wandb_init.py:init():1080] run started, returning control to user process
22
+ 2026-04-17 12:32:39,949 INFO MainThread:26590 [wandb_run.py:_config_callback():1385] config_cb None None {'peft_config': {'default': {'task_type': 'CAUSAL_LM', 'peft_type': 'LORA', 'auto_mapping': None, 'peft_version': '0.18.1', 'base_model_name_or_path': '/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/qwen3-asr-merged', 'revision': None, 'inference_mode': False, 'r': 8, 'target_modules': '^(thinker\\.model(?=\\.).*\\.(up_proj|v_proj|k_proj|o_proj|q_proj|gate_proj|down_proj)|thinker\\.audio_tower\\.layers(?=\\.).*\\.(v_proj|fc2|k_proj|fc1|q_proj|out_proj)|thinker\\.audio_tower\\.conv_out(?=\\.)|thinker\\.audio_tower\\.proj1(?=\\.)|thinker\\.audio_tower\\.proj2(?=\\.))$', 'exclude_modules': None, 'lora_alpha': 32, 'lora_dropout': 0.05, 'fan_in_fan_out': False, 'bias': 'none', 'use_rslora': False, 'modules_to_save': [], 'init_lora_weights': True, 'layers_to_transform': None, 'layers_pattern': None, 'rank_pattern': {}, 'alpha_pattern': {}, 'megatron_config': None, 'megatron_core': 'megatron.core', 'trainable_token_indices': None, 'loftq_config': {}, 'eva_config': None, 'corda_config': None, 'use_dora': False, 'alora_invocation_tokens': None, 'use_qalora': False, 'qalora_group_size': 16, 'layer_replication': None, 'runtime_config': {'ephemeral_gpu_offload': False}, 'lora_bias': False, 'target_parameters': None, 'arrow_config': None, 'ensure_weight_tying': False, 'lora_dtype': None, 'lorap_lr_ratio': None, 'lorap_emb_lr': 1e-06}}, 'return_dict': True, 'output_hidden_states': False, 'torchscript': False, 'dtype': 'bfloat16', 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'architectures': ['Qwen3ASRForConditionalGeneration'], 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'task_specific_params': None, 'problem_type': None, 
'tokenizer_class': None, 'prefix': None, 'bos_token_id': None, 'pad_token_id': 151643, 'eos_token_id': 151645, 'sep_token_id': None, 'decoder_start_token_id': None, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'temperature': 0.5, 'top_k': 50, 'top_p': 0.95, 'typical_p': 1.0, 'repetition_penalty': 1.08, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'num_beam_groups': 1, 'diversity_penalty': 0.0, '_name_or_path': '/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/qwen3-asr-merged', 'transformers_version': '4.57.6', 'model_type': 'qwen3_asr', 'tf_legacy_loss': False, 'use_bfloat16': False, 'thinker_config': {'return_dict': True, 'output_hidden_states': False, 'torchscript': False, 'dtype': 'bfloat16', 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'architectures': ['Qwen3ASRForConditionalGeneration'], 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'task_specific_params': None, 'problem_type': None, 'tokenizer_class': None, 'prefix': None, 'bos_token_id': None, 'pad_token_id': None, 'eos_token_id': None, 'sep_token_id': None, 'decoder_start_token_id': None, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'typical_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 
'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'num_beam_groups': 1, 'diversity_penalty': 0.0, '_name_or_path': '', 'audio_end_token_id': 151670, 'model_type': 'qwen3_asr_thinker', 'tf_legacy_loss': False, 'use_bfloat16': False, 'user_token_id': 872, 'audio_start_token_id': 151669, 'initializer_range': 0.02, 'audio_config': {'return_dict': True, 'output_hidden_states': False, 'torchscript': False, 'dtype': None, 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'architectures': None, 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'task_specific_params': None, 'problem_type': None, 'tokenizer_class': None, 'prefix': None, 'bos_token_id': None, 'pad_token_id': None, 'eos_token_id': None, 'sep_token_id': None, 'decoder_start_token_id': None, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'typical_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'num_beam_groups': 1, 'diversity_penalty': 0.0, '_name_or_path': '', 'model_type': 'qwen3_asr_audio_encoder', 'num_hidden_layers': 24, 'tf_legacy_loss': False, 'use_bfloat16': False, 'num_mel_bins': 128, 'd_model': 
1024, 'encoder_layers': 24, 'encoder_attention_heads': 16, 'encoder_ffn_dim': 4096, 'dropout': 0, 'attention_dropout': 0, 'activation_function': 'gelu', 'activation_dropout': 0, 'initializer_range': 0.02, 'scale_embedding': False, 'max_source_positions': 1500, 'n_window': 50, 'output_dim': 2048, 'n_window_infer': 800, 'conv_chunksize': 500, 'downsample_hidden_size': 480, 'output_attentions': False}, 'text_config': {'vocab_size': 151936, 'max_position_embeddings': 65536, 'hidden_size': 2048, 'intermediate_size': 6144, 'num_hidden_layers': 28, 'num_attention_heads': 16, 'num_key_value_heads': 8, 'head_dim': 128, 'hidden_act': 'silu', 'initializer_range': 0.02, 'rms_norm_eps': 1e-06, 'use_cache': False, 'rope_theta': 1000000, 'rope_scaling': {'interleaved': True, 'mrope_interleaved': True, 'mrope_section': [24, 20, 20], 'rope_type': 'default', 'type': 'default'}, 'attention_bias': False, 'attention_dropout': 0.0, 'return_dict': True, 'output_hidden_states': False, 'torchscript': False, 'dtype': None, 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'architectures': None, 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'task_specific_params': None, 'problem_type': None, 'tokenizer_class': None, 'prefix': None, 'bos_token_id': None, 'pad_token_id': 151643, 'eos_token_id': None, 'sep_token_id': None, 'decoder_start_token_id': None, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'typical_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 
'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'num_beam_groups': 1, 'diversity_penalty': 0.0, '_name_or_path': '', 'model_type': 'qwen3_asr_text', 'tf_legacy_loss': False, 'use_bfloat16': False, 'output_attentions': False}, 'audio_token_id': 151676, 'output_attentions': False}, 'support_languages': ['Chinese', 'English', 'Cantonese', 'Arabic', 'German', 'French', 'Spanish', 'Portuguese', 'Indonesian', 'Italian', 'Korean', 'Russian', 'Thai', 'Vietnamese', 'Japanese', 'Turkish', 'Hindi', 'Malay', 'Dutch', 'Swedish', 'Danish', 'Finnish', 'Polish', 'Czech', 'Filipino', 'Persian', 'Greek', 'Romanian', 'Hungarian', 'Macedonian'], 'output_attentions': False, 'output_dir': '/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/out/qwen3asr_dapo_reward56_4x4x12_12gen_4GPU/v3-20260417-123227', 'overwrite_output_dir': False, 'do_train': False, 'do_eval': True, 'do_predict': False, 'eval_strategy': 'steps', 'prediction_loss_only': False, 'per_device_train_batch_size': 8, 'per_device_eval_batch_size': 8, 'per_gpu_train_batch_size': None, 'per_gpu_eval_batch_size': None, 'gradient_accumulation_steps': 12, 'eval_accumulation_steps': None, 'eval_delay': 0, 'torch_empty_cache_steps': None, 'learning_rate': 5e-05, 'weight_decay': 0.1, 'adam_beta1': 0.9, 'adam_beta2': 0.95, 'adam_epsilon': 1e-08, 'max_grad_norm': 1.0, 'num_train_epochs': 3.0, 'max_steps': -1, 'lr_scheduler_type': 'cosine', 'lr_scheduler_kwargs': None, 'warmup_ratio': 0.03, 'warmup_steps': 0, 'log_level': 'passive', 'log_level_replica': 'warning', 'log_on_each_node': True, 'logging_dir': '/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/out/qwen3asr_dapo_reward56_4x4x12_12gen_4GPU/v3-20260417-123227/runs', 'logging_strategy': 'steps', 'logging_first_step': True, 'logging_steps': 5, 'logging_nan_inf_filter': True, 'save_strategy': 'steps', 'save_steps': 20, 'save_total_limit': 
None, 'save_safetensors': True, 'save_on_each_node': False, 'save_only_model': False, 'restore_callback_states_from_checkpoint': False, 'no_cuda': False, 'use_cpu': False, 'use_mps_device': False, 'seed': 42, 'data_seed': 42, 'jit_mode_eval': False, 'bf16': True, 'fp16': False, 'fp16_opt_level': 'O1', 'half_precision_backend': 'auto', 'bf16_full_eval': False, 'fp16_full_eval': False, 'tf32': None, 'local_rank': 0, 'ddp_backend': None, 'tpu_num_cores': None, 'tpu_metrics_debug': False, 'debug': [], 'dataloader_drop_last': True, 'eval_steps': 20, 'dataloader_num_workers': 1, 'dataloader_prefetch_factor': 2, 'past_index': -1, 'run_name': 'qwen3asr_dapo_reward56_4x4x12_12gen_4GPU', 'disable_tqdm': False, 'remove_unused_columns': False, 'label_names': None, 'load_best_model_at_end': False, 'metric_for_best_model': 'loss', 'greater_is_better': False, 'ignore_data_skip': False, 'fsdp': [], 'fsdp_min_num_params': 0, 'fsdp_config': {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}, 'fsdp_transformer_layer_cls_to_wrap': None, 'accelerator_config': {'split_batches': False, 'dispatch_batches': False, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None}, 'parallelism_config': None, 'deepspeed': None, 'label_smoothing_factor': 0.0, 'optim': 'adamw_torch', 'optim_args': None, 'adafactor': False, 'group_by_length': False, 'length_column_name': 'length', 'report_to': ['wandb'], 'project': 'huggingface', 'trackio_space_id': 'trackio', 'ddp_find_unused_parameters': None, 'ddp_bucket_cap_mb': None, 'ddp_broadcast_buffers': None, 'dataloader_pin_memory': True, 'dataloader_persistent_workers': False, 'skip_memory_metrics': True, 'use_legacy_prediction_loop': False, 'push_to_hub': False, 'resume_from_checkpoint': None, 'hub_model_id': None, 'hub_strategy': 'every_save', 'hub_token': '<HUB_TOKEN>', 'hub_private_repo': None, 'hub_always_push': False, 'hub_revision': None, 
'gradient_checkpointing': False, 'gradient_checkpointing_kwargs': None, 'include_inputs_for_metrics': False, 'include_for_metrics': [], 'eval_do_concat_batches': True, 'fp16_backend': 'auto', 'push_to_hub_model_id': None, 'push_to_hub_organization': None, 'push_to_hub_token': '<PUSH_TO_HUB_TOKEN>', 'mp_parameters': '', 'auto_find_batch_size': False, 'full_determinism': False, 'torchdynamo': None, 'ray_scope': 'last', 'ddp_timeout': 18000000, 'torch_compile': False, 'torch_compile_backend': None, 'torch_compile_mode': None, 'include_tokens_per_second': False, 'include_num_input_tokens_seen': 'no', 'neftune_noise_alpha': None, 'optim_target_modules': None, 'batch_eval_metrics': False, 'eval_on_start': False, 'use_liger_kernel': False, 'liger_kernel_config': None, 'eval_use_gather_object': False, 'average_tokens_across_devices': True, 'model_init_kwargs': None, 'disable_dropout': False, 'cast_lm_head_to_fp32': False, 'num_generations': 12, 'num_generations_eval': 4, 'max_completion_length': 256, 'ds3_gather_for_generation': True, 'shuffle_dataset': True, 'generation_batch_size': 48, 'steps_per_generation': 3, 'min_p': None, 'generation_kwargs': None, 'chat_template_kwargs': None, 'use_transformers_paged': False, 'cache_implementation': None, 'use_vllm': False, 'vllm_mode': None, 'vllm_model_impl': 'vllm', 'vllm_enable_sleep_mode': False, 'vllm_structured_outputs_regex': None, 'vllm_server_base_url': None, 'vllm_server_host': None, 'vllm_server_port': [8000], 'vllm_server_timeout': 240.0, 'vllm_group_port': 51216, 'vllm_gpu_memory_utilization': 0.9, 'vllm_max_model_length': None, 'vllm_tensor_parallel_size': 1, 'beta': 0.04, 'num_iterations': 2, 'epsilon': 0.2, 'delta': None, 'epsilon_high': 0.28, 'sapo_temperature_neg': 1.05, 'sapo_temperature_pos': 1.0, 'importance_sampling_level': 'token', 'reward_weights': None, 'multi_objective_aggregation': 'sum_then_normalize', 'scale_rewards': 'group', 'loss_type': 'dapo', 'mask_truncated_completions': False, 'sync_ref_model': 
False, 'ref_model_mixup_alpha': 0.6, 'ref_model_sync_steps': 512, 'top_entropy_quantile': 1.0, 'max_tool_calling_iterations': None, 'vllm_importance_sampling_correction': True, 'vllm_importance_sampling_mode': 'sequence_mask', 'vllm_importance_sampling_cap': 3.0, 'off_policy_mask_threshold': None, 'use_bias_correction_kl': False, 'log_completions': True, 'num_completions_to_print': None, 'log_unique_prompts': False, 'log_completions_hub_repo': None, 'tuner_backend': 'peft', 'vit_gradient_checkpointing': True, 'router_aux_loss_coef': 0.0, 'enable_dft_loss': False, 'enable_channel_loss': False, 'safe_serialization': True, 'max_shard_size': '5GB', 'check_model': True, 'acc_strategy': 'token', 'train_dataloader_shuffle': True, 'max_epochs': None, 'aligner_lr': None, 'vit_lr': None, 'use_logits_to_keep': None, 'resume_only_model': False, 'optimizer': None, 'eval_metric': None, 'callbacks': [], 'early_stop_interval': None, 'eval_use_evalscope': False, 'eval_dataset': [], 'eval_dataset_args': None, 'eval_limit': None, 'eval_generation_config': None, 'extra_eval_args': None, 'tuner_type': 'lora', 'use_galore': False, 'galore_target_modules': None, 'galore_rank': 128, 'galore_update_proj_gap': 50, 'galore_scale': 1.0, 'galore_proj_type': 'std', 'galore_optim_per_parameter': False, 'galore_with_embedding': False, 'galore_quantization': False, 'galore_proj_quant': False, 'galore_proj_bits': 4, 'galore_proj_group_size': 256, 'galore_cos_threshold': 0.4, 'galore_gamma_proj': 2, 'galore_queue_size': 5, 'lisa_activated_layers': 0, 'lisa_step_interval': 20, 'use_flash_ckpt': False, 'vllm_pipeline_parallel_size': 1, 'vllm_enable_expert_parallel': False, 'vllm_max_num_seqs': None, 'vllm_max_model_len': None, 'vllm_disable_custom_all_reduce': True, 'vllm_enforce_eager': False, 'vllm_limit_mm_per_prompt': None, 'vllm_max_lora_rank': 16, 'vllm_enable_prefix_caching': True, 'vllm_use_async_engine': None, 'vllm_quantization': None, 'vllm_reasoning_parser': None, 
'vllm_disable_cascade_attn': False, 'vllm_mm_processor_cache_gb': None, 'vllm_speculative_config': None, 'vllm_engine_kwargs': {}, 'vllm_data_parallel_size': 1, 'stop_words': [], 'vllm_enable_lora': False, 'lora_rank': 8, 'vllm_server_group_port': None, 'enable_flattened_weight_sync': True, 'async_generate': False, 'structured_outputs_regex': None, 'sleep_level': 0, 'move_model_batches': None, 'offload_optimizer': False, 'offload_model': False, 'wandb_log_unique_prompts': None, 'cosine_min_len_value_wrong': -0.5, 'cosine_max_len_value_wrong': 0.0, 'cosine_min_len_value_correct': 1.0, 'cosine_max_len_value_correct': 0.5, 'cosine_max_len': 256, 'repetition_n_grams': 3, 'repetition_max_penalty': -1.0, 'reward_model': None, 'reward_model_plugin': None, 'chord_sft_dataset': [], 'chord_sft_per_device_train_batch_size': None, 'chord_enable_phi_function': False, 'chord_mu_warmup_steps': None, 'chord_mu_decay_steps': None, 'chord_mu_peak': None, 'chord_mu_valley': None, 'multi_turn_scheduler': None, 'max_turns': None, 'completion_length_limit_scope': 'per_round', 'vllm_server_pass_dataset': False, 'dynamic_sample': True, 'max_resample_times': 4, 'overlong_filter': True, 'soft_max_length': None, 'soft_cache_length': None, 'log_entropy': False, 'tau_pos': 1.0, 'tau_neg': 1.05, 'advantage_estimator': 'grpo', 'kl_in_reward': False, 'dataset_shuffle': True, 'rollout_importance_sampling_mode': None, 'rollout_importance_sampling_threshold': 2.0, 'log_rollout_offpolicy_metrics': False, 'off_policy_sequence_mask_delta': None}
23
+ 2026-04-17 12:32:39,959 INFO MainThread:26590 [wandb_config.py:__setitem__():154] [no run ID] config set model/num_parameters = 2050307712 - <bound method Run._config_callback of <wandb.sdk.wandb_run.Run object at 0x7f553c81a9e0>>
24
+ 2026-04-17 12:32:39,959 INFO MainThread:26590 [wandb_run.py:_config_callback():1385] config_cb model/num_parameters 2050307712 None
25
+ 2026-04-17 12:51:08,851 INFO wandb-AsyncioManager-main:26590 [service_client.py:_forward_responses():80] Reached EOF.
26
+ 2026-04-17 12:51:08,851 INFO wandb-AsyncioManager-main:26590 [mailbox.py:close():137] Closing mailbox, abandoning 1 handles.
wandb/run-20260417_125349-3c0s7mq3/files/config.yaml ADDED
@@ -0,0 +1,1273 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ _name_or_path:
2
+ value: /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/qwen3-asr-merged
3
+ _wandb:
4
+ value:
5
+ cli_version: 0.23.0
6
+ e:
7
+ j5sm4ok14e8glxftszvcldkdpfaj9tjk:
8
+ args:
9
+ - --rlhf_type
10
+ - grpo
11
+ - --external_plugins
12
+ - /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/my_qwen3_asr_dapo_register.py
13
+ - /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/0417_reward.py
14
+ - --model
15
+ - /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/qwen3-asr-merged
16
+ - --model_type
17
+ - my_qwen3_asr_rl
18
+ - --template
19
+ - my_qwen3_asr_rl
20
+ - --dataset
21
+ - /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/lora_0323_10w+55w+error+syn_with_domain_train90_targeted_rl_train90_loramerged_basewer_3suppress_server.jsonl
22
+ - --val_dataset
23
+ - /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/lora_0323_10w+55w+error+syn_with_domain_train90_targeted_rl_val5_sample5p_server.jsonl
24
+ - --reward_funcs
25
+ - asr_wer_sub_len_cmp_hallu_dirty_v56
26
+ - --train_type
27
+ - lora
28
+ - --use_vllm
29
+ - "false"
30
+ - --log_completions
31
+ - "true"
32
+ - --loss_type
33
+ - dapo
34
+ - --advantage_estimator
35
+ - grpo
36
+ - --scale_rewards
37
+ - group
38
+ - --num_iterations
39
+ - "2"
40
+ - --beta
41
+ - "0.04"
42
+ - --epsilon_high
43
+ - "0.28"
44
+ - --dynamic_sample
45
+ - "true"
46
+ - --max_resample_times
47
+ - "4"
48
+ - --overlong_filter
49
+ - "true"
50
+ - --truncation_strategy
51
+ - delete
52
+ - --num_generations
53
+ - "12"
54
+ - --generation_batch_size
55
+ - "48"
56
+ - --per_device_train_batch_size
57
+ - "4"
58
+ - --per_device_eval_batch_size
59
+ - "4"
60
+ - --gradient_accumulation_steps
61
+ - "12"
62
+ - --num_generations_eval
63
+ - "4"
64
+ - --max_completion_length
65
+ - "256"
66
+ - --temperature
67
+ - "0.50"
68
+ - --top_p
69
+ - "0.95"
70
+ - --top_k
71
+ - "50"
72
+ - --repetition_penalty
73
+ - "1.08"
74
+ - --learning_rate
75
+ - "5e-5"
76
+ - --lr_scheduler_type
77
+ - cosine
78
+ - --warmup_ratio
79
+ - "0.03"
80
+ - --report_to
81
+ - wandb
82
+ - --run_name
83
+ - qwen3asr_dapo_reward56_4x4x12_12gen_4GPU
84
+ - --output_dir
85
+ - /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/out/qwen3asr_dapo_reward56_4x4x12_12gen_4GPU
86
+ - --save_strategy
87
+ - steps
88
+ - --save_steps
89
+ - "20"
90
+ - --logging_steps
91
+ - "5"
92
+ - --freeze_llm
93
+ - "false"
94
+ - --freeze_vit
95
+ - "false"
96
+ - --freeze_aligner
97
+ - "false"
98
+ - --remove_unused_columns
99
+ - "false"
100
+ - --padding_side
101
+ - left
102
+ cpu_count: 64
103
+ cpu_count_logical: 128
104
+ cudaVersion: "12.4"
105
+ disk:
106
+ /:
107
+ total: "524945911808"
108
+ used: "49879580672"
109
+ email: pang_kaiyu@163.com
110
+ executable: /mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/bin/python3.10
111
+ gpu: NVIDIA A100-SXM4-80GB
112
+ gpu_count: 8
113
+ gpu_nvidia:
114
+ - architecture: Ampere
115
+ cudaCores: 6912
116
+ memoryTotal: "85899345920"
117
+ name: NVIDIA A100-SXM4-80GB
118
+ uuid: GPU-3da6624c-f6f7-fce6-4711-27acab73dc93
119
+ - architecture: Ampere
120
+ cudaCores: 6912
121
+ memoryTotal: "85899345920"
122
+ name: NVIDIA A100-SXM4-80GB
123
+ uuid: GPU-dae83544-a631-a3fe-b5d5-e4fdd056c7a8
124
+ - architecture: Ampere
125
+ cudaCores: 6912
126
+ memoryTotal: "85899345920"
127
+ name: NVIDIA A100-SXM4-80GB
128
+ uuid: GPU-621aa0b9-4a32-d349-8a16-20b8b6f0dde4
129
+ - architecture: Ampere
130
+ cudaCores: 6912
131
+ memoryTotal: "85899345920"
132
+ name: NVIDIA A100-SXM4-80GB
133
+ uuid: GPU-642bed5e-3bf1-b5e0-8aba-33f8f64a5dcc
134
+ - architecture: Ampere
135
+ cudaCores: 6912
136
+ memoryTotal: "85899345920"
137
+ name: NVIDIA A100-SXM4-80GB
138
+ uuid: GPU-6c70bd3b-1e58-bd2a-a10b-19891e3eab9a
139
+ - architecture: Ampere
140
+ cudaCores: 6912
141
+ memoryTotal: "85899345920"
142
+ name: NVIDIA A100-SXM4-80GB
143
+ uuid: GPU-96e9e2d3-6436-3c7f-5a20-1d4a32e7992c
144
+ - architecture: Ampere
145
+ cudaCores: 6912
146
+ memoryTotal: "85899345920"
147
+ name: NVIDIA A100-SXM4-80GB
148
+ uuid: GPU-dba7546f-0cda-e659-ca1d-4790c27ffe8d
149
+ - architecture: Ampere
150
+ cudaCores: 6912
151
+ memoryTotal: "85899345920"
152
+ name: NVIDIA A100-SXM4-80GB
153
+ uuid: GPU-b0a96cf9-74f3-969a-e8d0-5a30f3f06d1e
154
+ host: SH-IDC1-10-140-37-28
155
+ memory:
156
+ total: "1081627828224"
157
+ os: Linux-3.10.0-957.el7.x86_64-x86_64-with-glibc2.17
158
+ program: /mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/cli/rlhf.py
159
+ python: CPython 3.10.18
160
+ root: /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload
161
+ slurm:
162
+ cluster_name: cluster_sproject3
163
+ conf: /etc/slurm/slurm.conf
164
+ cpus_on_node: "2"
165
+ gtids: "0"
166
+ job_account: research
167
+ job_cpus_per_node: "2"
168
+ job_gid: "800000689"
169
+ job_id: "8568855"
170
+ job_name: qwen3_asr_train_4gpu
171
+ job_nodelist: SH-IDC1-10-140-37-28
172
+ job_num_nodes: "1"
173
+ job_partition: interntmp
174
+ job_qos: normal
175
+ job_uid: "800000689"
176
+ job_user: panjiabao
177
+ jobid: "8568855"
178
+ launch_node_ipaddr: 10.140.37.164
179
+ localid: "0"
180
+ nnodes: "1"
181
+ nodeid: "0"
182
+ nodelist: SH-IDC1-10-140-37-28
183
+ nprocs: "1"
184
+ ntasks: "1"
185
+ ntasks_per_node: "1"
186
+ prio_process: "0"
187
+ procid: "0"
188
+ srun_comm_host: 10.140.37.164
189
+ srun_comm_port: "39944"
190
+ step_gpus: 4,5,6,7
191
+ step_id: "0"
192
+ step_launcher_port: "39944"
193
+ step_nodelist: SH-IDC1-10-140-37-28
194
+ step_num_nodes: "1"
195
+ step_num_tasks: "1"
196
+ step_tasks_per_node: "1"
197
+ stepid: "0"
198
+ submit_dir: /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload
199
+ submit_host: SH-IDC1-10-140-37-164
200
+ task_pid: "253884"
201
+ tasks_per_node: "1"
202
+ topology_addr: SH-IDC1-10-140-37-28
203
+ topology_addr_pattern: node
204
+ umask: "0002"
205
+ working_cluster: cluster_sproject3:SH-IDC1-10-140-37-161:6817:9216:109
206
+ startedAt: "2026-04-17T04:53:49.174280Z"
207
+ writerId: j5sm4ok14e8glxftszvcldkdpfaj9tjk
208
+ m:
209
+ - "1": train/global_step
210
+ "6":
211
+ - 3
212
+ "7": []
213
+ - "2": '*'
214
+ "5": 1
215
+ "6":
216
+ - 1
217
+ "7": []
218
+ python_version: 3.10.18
219
+ t:
220
+ "1":
221
+ - 1
222
+ - 5
223
+ - 11
224
+ - 30
225
+ - 41
226
+ - 49
227
+ - 51
228
+ - 53
229
+ - 71
230
+ - 84
231
+ - 95
232
+ - 98
233
+ - 105
234
+ "2":
235
+ - 1
236
+ - 5
237
+ - 11
238
+ - 30
239
+ - 41
240
+ - 49
241
+ - 51
242
+ - 53
243
+ - 71
244
+ - 84
245
+ - 95
246
+ - 98
247
+ - 105
248
+ "3":
249
+ - 7
250
+ - 13
251
+ - 19
252
+ - 66
253
+ "4": 3.10.18
254
+ "5": 0.23.0
255
+ "6": 4.57.6
256
+ "9":
257
+ "1": transformers_trainer
258
+ "12": 0.23.0
259
+ "13": linux-x86_64
260
+ acc_strategy:
261
+ value: token
262
+ accelerator_config:
263
+ value:
264
+ dispatch_batches: false
265
+ even_batches: true
266
+ gradient_accumulation_kwargs: null
267
+ non_blocking: false
268
+ split_batches: false
269
+ use_seedable_sampler: true
270
+ adafactor:
271
+ value: false
272
+ adam_beta1:
273
+ value: 0.9
274
+ adam_beta2:
275
+ value: 0.95
276
+ adam_epsilon:
277
+ value: 1e-08
278
+ add_cross_attention:
279
+ value: false
280
+ advantage_estimator:
281
+ value: grpo
282
+ aligner_lr:
283
+ value: null
284
+ architectures:
285
+ value:
286
+ - Qwen3ASRForConditionalGeneration
287
+ async_generate:
288
+ value: false
289
+ auto_find_batch_size:
290
+ value: false
291
+ average_tokens_across_devices:
292
+ value: true
293
+ bad_words_ids:
294
+ value: null
295
+ batch_eval_metrics:
296
+ value: false
297
+ begin_suppress_tokens:
298
+ value: null
299
+ beta:
300
+ value: 0.04
301
+ bf16:
302
+ value: true
303
+ bf16_full_eval:
304
+ value: false
305
+ bos_token_id:
306
+ value: null
307
+ cache_implementation:
308
+ value: null
309
+ callbacks:
310
+ value: []
311
+ cast_lm_head_to_fp32:
312
+ value: false
313
+ chat_template_kwargs:
314
+ value: null
315
+ check_model:
316
+ value: true
317
+ chord_enable_phi_function:
318
+ value: false
319
+ chord_mu_decay_steps:
320
+ value: null
321
+ chord_mu_peak:
322
+ value: null
323
+ chord_mu_valley:
324
+ value: null
325
+ chord_mu_warmup_steps:
326
+ value: null
327
+ chord_sft_dataset:
328
+ value: []
329
+ chord_sft_per_device_train_batch_size:
330
+ value: null
331
+ chunk_size_feed_forward:
332
+ value: 0
333
+ completion_length_limit_scope:
334
+ value: per_round
335
+ cosine_max_len:
336
+ value: 256
337
+ cosine_max_len_value_correct:
338
+ value: 0.5
339
+ cosine_max_len_value_wrong:
340
+ value: 0
341
+ cosine_min_len_value_correct:
342
+ value: 1
343
+ cosine_min_len_value_wrong:
344
+ value: -0.5
345
+ cross_attention_hidden_size:
346
+ value: null
347
+ data_seed:
348
+ value: 42
349
+ dataloader_drop_last:
350
+ value: true
351
+ dataloader_num_workers:
352
+ value: 1
353
+ dataloader_persistent_workers:
354
+ value: false
355
+ dataloader_pin_memory:
356
+ value: true
357
+ dataloader_prefetch_factor:
358
+ value: 2
359
+ dataset_shuffle:
360
+ value: true
361
+ ddp_backend:
362
+ value: null
363
+ ddp_broadcast_buffers:
364
+ value: null
365
+ ddp_bucket_cap_mb:
366
+ value: null
367
+ ddp_find_unused_parameters:
368
+ value: null
369
+ ddp_timeout:
370
+ value: 18000000
371
+ debug:
372
+ value: []
373
+ decoder_start_token_id:
374
+ value: null
375
+ deepspeed:
376
+ value: null
377
+ delta:
378
+ value: null
379
+ disable_dropout:
380
+ value: false
381
+ disable_tqdm:
382
+ value: false
383
+ diversity_penalty:
384
+ value: 0
385
+ do_eval:
386
+ value: true
387
+ do_predict:
388
+ value: false
389
+ do_sample:
390
+ value: false
391
+ do_train:
392
+ value: false
393
+ ds3_gather_for_generation:
394
+ value: true
395
+ dtype:
396
+ value: bfloat16
397
+ dynamic_sample:
398
+ value: true
399
+ early_stop_interval:
400
+ value: null
401
+ early_stopping:
402
+ value: false
403
+ enable_channel_loss:
404
+ value: false
405
+ enable_dft_loss:
406
+ value: false
407
+ enable_flattened_weight_sync:
408
+ value: true
409
+ encoder_no_repeat_ngram_size:
410
+ value: 0
411
+ eos_token_id:
412
+ value: 151645
413
+ epsilon:
414
+ value: 0.2
415
+ epsilon_high:
416
+ value: 0.28
417
+ eval_accumulation_steps:
418
+ value: null
419
+ eval_dataset:
420
+ value: []
421
+ eval_dataset_args:
422
+ value: null
423
+ eval_delay:
424
+ value: 0
425
+ eval_do_concat_batches:
426
+ value: true
427
+ eval_generation_config:
428
+ value: null
429
+ eval_limit:
430
+ value: null
431
+ eval_metric:
432
+ value: null
433
+ eval_on_start:
434
+ value: false
435
+ eval_steps:
436
+ value: 20
437
+ eval_strategy:
438
+ value: steps
439
+ eval_use_evalscope:
440
+ value: false
441
+ eval_use_gather_object:
442
+ value: false
443
+ exponential_decay_length_penalty:
444
+ value: null
445
+ extra_eval_args:
446
+ value: null
447
+ finetuning_task:
448
+ value: null
449
+ forced_bos_token_id:
450
+ value: null
451
+ forced_eos_token_id:
452
+ value: null
453
+ fp16:
454
+ value: false
455
+ fp16_backend:
456
+ value: auto
457
+ fp16_full_eval:
458
+ value: false
459
+ fp16_opt_level:
460
+ value: O1
461
+ fsdp:
462
+ value: []
463
+ fsdp_config:
464
+ value:
465
+ min_num_params: 0
466
+ xla: false
467
+ xla_fsdp_grad_ckpt: false
468
+ xla_fsdp_v2: false
469
+ fsdp_min_num_params:
470
+ value: 0
471
+ fsdp_transformer_layer_cls_to_wrap:
472
+ value: null
473
+ full_determinism:
474
+ value: false
475
+ galore_cos_threshold:
476
+ value: 0.4
477
+ galore_gamma_proj:
478
+ value: 2
479
+ galore_optim_per_parameter:
480
+ value: false
481
+ galore_proj_bits:
482
+ value: 4
483
+ galore_proj_group_size:
484
+ value: 256
485
+ galore_proj_quant:
486
+ value: false
487
+ galore_proj_type:
488
+ value: std
489
+ galore_quantization:
490
+ value: false
491
+ galore_queue_size:
492
+ value: 5
493
+ galore_rank:
494
+ value: 128
495
+ galore_scale:
496
+ value: 1
497
+ galore_target_modules:
498
+ value: null
499
+ galore_update_proj_gap:
500
+ value: 50
501
+ galore_with_embedding:
502
+ value: false
503
+ generation_batch_size:
504
+ value: 48
505
+ generation_kwargs:
506
+ value: null
507
+ gradient_accumulation_steps:
508
+ value: 12
509
+ gradient_checkpointing:
510
+ value: false
511
+ gradient_checkpointing_kwargs:
512
+ value: null
513
+ greater_is_better:
514
+ value: false
515
+ group_by_length:
516
+ value: false
517
+ half_precision_backend:
518
+ value: auto
519
+ hub_always_push:
520
+ value: false
521
+ hub_model_id:
522
+ value: null
523
+ hub_private_repo:
524
+ value: null
525
+ hub_revision:
526
+ value: null
527
+ hub_strategy:
528
+ value: every_save
529
+ hub_token:
530
+ value: <HUB_TOKEN>
531
+ id2label:
532
+ value:
533
+ "0": LABEL_0
534
+ "1": LABEL_1
535
+ ignore_data_skip:
536
+ value: false
537
+ importance_sampling_level:
538
+ value: token
539
+ include_for_metrics:
540
+ value: []
541
+ include_inputs_for_metrics:
542
+ value: false
543
+ include_num_input_tokens_seen:
544
+ value: "no"
545
+ include_tokens_per_second:
546
+ value: false
547
+ is_decoder:
548
+ value: false
549
+ is_encoder_decoder:
550
+ value: false
551
+ jit_mode_eval:
552
+ value: false
553
+ kl_in_reward:
554
+ value: false
555
+ label_names:
556
+ value: null
557
+ label_smoothing_factor:
558
+ value: 0
559
+ label2id:
560
+ value:
561
+ LABEL_0: 0
562
+ LABEL_1: 1
563
+ learning_rate:
564
+ value: 5e-05
565
+ length_column_name:
566
+ value: length
567
+ length_penalty:
568
+ value: 1
569
+ liger_kernel_config:
570
+ value: null
571
+ lisa_activated_layers:
572
+ value: 0
573
+ lisa_step_interval:
574
+ value: 20
575
+ load_best_model_at_end:
576
+ value: false
577
+ local_rank:
578
+ value: 0
579
+ log_completions:
580
+ value: true
581
+ log_completions_hub_repo:
582
+ value: null
583
+ log_entropy:
584
+ value: false
585
+ log_level:
586
+ value: passive
587
+ log_level_replica:
588
+ value: warning
589
+ log_on_each_node:
590
+ value: true
591
+ log_rollout_offpolicy_metrics:
592
+ value: false
593
+ log_unique_prompts:
594
+ value: false
595
+ logging_dir:
596
+ value: /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/out/qwen3asr_dapo_reward56_4x4x12_12gen_4GPU/v4-20260417-125332/runs
597
+ logging_first_step:
598
+ value: true
599
+ logging_nan_inf_filter:
600
+ value: true
601
+ logging_steps:
602
+ value: 5
603
+ logging_strategy:
604
+ value: steps
605
+ lora_rank:
606
+ value: 8
607
+ loss_type:
608
+ value: dapo
609
+ lr_scheduler_kwargs:
610
+ value: null
611
+ lr_scheduler_type:
612
+ value: cosine
613
+ mask_truncated_completions:
614
+ value: false
615
+ max_completion_length:
616
+ value: 256
617
+ max_epochs:
618
+ value: null
619
+ max_grad_norm:
620
+ value: 1
621
+ max_length:
622
+ value: 20
623
+ max_resample_times:
624
+ value: 4
625
+ max_shard_size:
626
+ value: 5GB
627
+ max_steps:
628
+ value: -1
629
+ max_tool_calling_iterations:
630
+ value: null
631
+ max_turns:
632
+ value: null
633
+ metric_for_best_model:
634
+ value: loss
635
+ min_length:
636
+ value: 0
637
+ min_p:
638
+ value: null
639
+ model/num_parameters:
640
+ value: 2050307712
641
+ model_init_kwargs:
642
+ value: null
643
+ model_type:
644
+ value: qwen3_asr
645
+ move_model_batches:
646
+ value: null
647
+ mp_parameters:
648
+ value: ""
649
+ multi_objective_aggregation:
650
+ value: sum_then_normalize
651
+ multi_turn_scheduler:
652
+ value: null
653
+ neftune_noise_alpha:
654
+ value: null
655
+ no_cuda:
656
+ value: false
657
+ no_repeat_ngram_size:
658
+ value: 0
659
+ num_beam_groups:
660
+ value: 1
661
+ num_beams:
662
+ value: 1
663
+ num_completions_to_print:
664
+ value: null
665
+ num_generations:
666
+ value: 12
667
+ num_generations_eval:
668
+ value: 4
669
+ num_iterations:
670
+ value: 2
671
+ num_return_sequences:
672
+ value: 1
673
+ num_train_epochs:
674
+ value: 3
675
+ off_policy_mask_threshold:
676
+ value: null
677
+ off_policy_sequence_mask_delta:
678
+ value: null
679
+ offload_model:
680
+ value: false
681
+ offload_optimizer:
682
+ value: false
683
+ optim:
684
+ value: adamw_torch
685
+ optim_args:
686
+ value: null
687
+ optim_target_modules:
688
+ value: null
689
+ optimizer:
690
+ value: null
691
+ output_attentions:
692
+ value: false
693
+ output_dir:
694
+ value: /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/out/qwen3asr_dapo_reward56_4x4x12_12gen_4GPU/v4-20260417-125332
695
+ output_hidden_states:
696
+ value: false
697
+ output_scores:
698
+ value: false
699
+ overlong_filter:
700
+ value: true
701
+ overwrite_output_dir:
702
+ value: false
703
+ pad_token_id:
704
+ value: 151643
705
+ parallelism_config:
706
+ value: null
707
+ past_index:
708
+ value: -1
709
+ peft_config:
710
+ value:
711
+ default:
712
+ alora_invocation_tokens: null
713
+ arrow_config: null
714
+ auto_mapping: null
715
+ base_model_name_or_path: /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/qwen3-asr-merged
716
+ bias: none
717
+ corda_config: null
718
+ ensure_weight_tying: false
719
+ eva_config: null
720
+ exclude_modules: null
721
+ fan_in_fan_out: false
722
+ inference_mode: false
723
+ init_lora_weights: true
724
+ layer_replication: null
725
+ layers_pattern: null
726
+ layers_to_transform: null
727
+ lora_alpha: 32
728
+ lora_bias: false
729
+ lora_dropout: 0.05
730
+ lora_dtype: null
731
+ lorap_emb_lr: 1e-06
732
+ lorap_lr_ratio: null
733
+ megatron_config: null
734
+ megatron_core: megatron.core
735
+ modules_to_save: []
736
+ peft_type: LORA
737
+ peft_version: 0.18.1
738
+ qalora_group_size: 16
739
+ r: 8
740
+ revision: null
741
+ runtime_config:
742
+ ephemeral_gpu_offload: false
743
+ target_modules: ^(thinker\.model(?=\.).*\.(k_proj|q_proj|down_proj|up_proj|v_proj|gate_proj|o_proj)|thinker\.audio_tower\.layers(?=\.).*\.(k_proj|fc1|fc2|q_proj|out_proj|v_proj)|thinker\.audio_tower\.conv_out(?=\.)|thinker\.audio_tower\.proj1(?=\.)|thinker\.audio_tower\.proj2(?=\.))$
744
+ target_parameters: null
745
+ task_type: CAUSAL_LM
746
+ trainable_token_indices: null
747
+ use_dora: false
748
+ use_qalora: false
749
+ use_rslora: false
750
+ per_device_eval_batch_size:
751
+ value: 4
752
+ per_device_train_batch_size:
753
+ value: 4
754
+ per_gpu_eval_batch_size:
755
+ value: null
756
+ per_gpu_train_batch_size:
757
+ value: null
758
+ prediction_loss_only:
759
+ value: false
760
+ prefix:
761
+ value: null
762
+ problem_type:
763
+ value: null
764
+ project:
765
+ value: huggingface
766
+ push_to_hub:
767
+ value: false
768
+ push_to_hub_model_id:
769
+ value: null
770
+ push_to_hub_organization:
771
+ value: null
772
+ push_to_hub_token:
773
+ value: <PUSH_TO_HUB_TOKEN>
774
+ ray_scope:
775
+ value: last
776
+ ref_model_mixup_alpha:
777
+ value: 0.6
778
+ ref_model_sync_steps:
779
+ value: 512
780
+ remove_invalid_values:
781
+ value: false
782
+ remove_unused_columns:
783
+ value: false
784
+ repetition_max_penalty:
785
+ value: -1
786
+ repetition_n_grams:
787
+ value: 3
788
+ repetition_penalty:
789
+ value: 1.08
790
+ report_to:
791
+ value:
792
+ - wandb
793
+ restore_callback_states_from_checkpoint:
794
+ value: false
795
+ resume_from_checkpoint:
796
+ value: null
797
+ resume_only_model:
798
+ value: false
799
+ return_dict:
800
+ value: true
801
+ return_dict_in_generate:
802
+ value: false
803
+ reward_model:
804
+ value: null
805
+ reward_model_plugin:
806
+ value: null
807
+ reward_weights:
808
+ value: null
809
+ rollout_importance_sampling_mode:
810
+ value: null
811
+ rollout_importance_sampling_threshold:
812
+ value: 2
813
+ router_aux_loss_coef:
814
+ value: 0
815
+ run_name:
816
+ value: qwen3asr_dapo_reward56_4x4x12_12gen_4GPU
817
+ safe_serialization:
818
+ value: true
819
+ sapo_temperature_neg:
820
+ value: 1.05
821
+ sapo_temperature_pos:
822
+ value: 1
823
+ save_on_each_node:
824
+ value: false
825
+ save_only_model:
826
+ value: false
827
+ save_safetensors:
828
+ value: true
829
+ save_steps:
830
+ value: 20
831
+ save_strategy:
832
+ value: steps
833
+ save_total_limit:
834
+ value: null
835
+ scale_rewards:
836
+ value: group
837
+ seed:
838
+ value: 42
839
+ sep_token_id:
840
+ value: null
841
+ shuffle_dataset:
842
+ value: true
843
+ skip_memory_metrics:
844
+ value: true
845
+ sleep_level:
846
+ value: 0
847
+ soft_cache_length:
848
+ value: null
849
+ soft_max_length:
850
+ value: null
851
+ steps_per_generation:
852
+ value: 3
853
+ stop_words:
854
+ value: []
855
+ structured_outputs_regex:
856
+ value: null
857
+ support_languages:
858
+ value:
859
+ - Chinese
860
+ - English
861
+ - Cantonese
862
+ - Arabic
863
+ - German
864
+ - French
865
+ - Spanish
866
+ - Portuguese
867
+ - Indonesian
868
+ - Italian
869
+ - Korean
870
+ - Russian
871
+ - Thai
872
+ - Vietnamese
873
+ - Japanese
874
+ - Turkish
875
+ - Hindi
876
+ - Malay
877
+ - Dutch
878
+ - Swedish
879
+ - Danish
880
+ - Finnish
881
+ - Polish
882
+ - Czech
883
+ - Filipino
884
+ - Persian
885
+ - Greek
886
+ - Romanian
887
+ - Hungarian
888
+ - Macedonian
889
+ suppress_tokens:
890
+ value: null
891
+ sync_ref_model:
892
+ value: false
893
+ task_specific_params:
894
+ value: null
895
+ tau_neg:
896
+ value: 1.05
897
+ tau_pos:
898
+ value: 1
899
+ temperature:
900
+ value: 0.5
901
+ tf_legacy_loss:
902
+ value: false
903
+ tf32:
904
+ value: null
905
+ thinker_config:
906
+ value:
907
+ _name_or_path: ""
908
+ add_cross_attention: false
909
+ architectures:
910
+ - Qwen3ASRForConditionalGeneration
911
+ audio_config:
912
+ _name_or_path: ""
913
+ activation_dropout: 0
914
+ activation_function: gelu
915
+ add_cross_attention: false
916
+ architectures: null
917
+ attention_dropout: 0
918
+ bad_words_ids: null
919
+ begin_suppress_tokens: null
920
+ bos_token_id: null
921
+ chunk_size_feed_forward: 0
922
+ conv_chunksize: 500
923
+ cross_attention_hidden_size: null
924
+ d_model: 1024
925
+ decoder_start_token_id: null
926
+ diversity_penalty: 0
927
+ do_sample: false
928
+ downsample_hidden_size: 480
929
+ dropout: 0
930
+ dtype: null
931
+ early_stopping: false
932
+ encoder_attention_heads: 16
933
+ encoder_ffn_dim: 4096
934
+ encoder_layers: 24
935
+ encoder_no_repeat_ngram_size: 0
936
+ eos_token_id: null
937
+ exponential_decay_length_penalty: null
938
+ finetuning_task: null
939
+ forced_bos_token_id: null
940
+ forced_eos_token_id: null
941
+ id2label:
942
+ "0": LABEL_0
943
+ "1": LABEL_1
944
+ initializer_range: 0.02
945
+ is_decoder: false
946
+ is_encoder_decoder: false
947
+ label2id:
948
+ LABEL_0: 0
949
+ LABEL_1: 1
950
+ length_penalty: 1
951
+ max_length: 20
952
+ max_source_positions: 1500
953
+ min_length: 0
954
+ model_type: qwen3_asr_audio_encoder
955
+ n_window: 50
956
+ n_window_infer: 800
957
+ no_repeat_ngram_size: 0
958
+ num_beam_groups: 1
959
+ num_beams: 1
960
+ num_hidden_layers: 24
961
+ num_mel_bins: 128
962
+ num_return_sequences: 1
963
+ output_attentions: false
964
+ output_dim: 2048
965
+ output_hidden_states: false
966
+ output_scores: false
967
+ pad_token_id: null
968
+ prefix: null
969
+ problem_type: null
970
+ remove_invalid_values: false
971
+ repetition_penalty: 1
972
+ return_dict: true
973
+ return_dict_in_generate: false
974
+ scale_embedding: false
975
+ sep_token_id: null
976
+ suppress_tokens: null
977
+ task_specific_params: null
978
+ temperature: 1
979
+ tf_legacy_loss: false
980
+ tie_encoder_decoder: false
981
+ tie_word_embeddings: true
982
+ tokenizer_class: null
983
+ top_k: 50
984
+ top_p: 1
985
+ torchscript: false
986
+ typical_p: 1
987
+ use_bfloat16: false
988
+ audio_end_token_id: 151670
989
+ audio_start_token_id: 151669
990
+ audio_token_id: 151676
991
+ bad_words_ids: null
992
+ begin_suppress_tokens: null
993
+ bos_token_id: null
994
+ chunk_size_feed_forward: 0
995
+ cross_attention_hidden_size: null
996
+ decoder_start_token_id: null
997
+ diversity_penalty: 0
998
+ do_sample: false
999
+ dtype: bfloat16
1000
+ early_stopping: false
1001
+ encoder_no_repeat_ngram_size: 0
1002
+ eos_token_id: null
1003
+ exponential_decay_length_penalty: null
1004
+ finetuning_task: null
1005
+ forced_bos_token_id: null
1006
+ forced_eos_token_id: null
1007
+ id2label:
1008
+ "0": LABEL_0
1009
+ "1": LABEL_1
1010
+ initializer_range: 0.02
1011
+ is_decoder: false
1012
+ is_encoder_decoder: false
1013
+ label2id:
1014
+ LABEL_0: 0
1015
+ LABEL_1: 1
1016
+ length_penalty: 1
1017
+ max_length: 20
1018
+ min_length: 0
1019
+ model_type: qwen3_asr_thinker
1020
+ no_repeat_ngram_size: 0
1021
+ num_beam_groups: 1
1022
+ num_beams: 1
1023
+ num_return_sequences: 1
1024
+ output_attentions: false
1025
+ output_hidden_states: false
1026
+ output_scores: false
1027
+ pad_token_id: null
1028
+ prefix: null
1029
+ problem_type: null
1030
+ remove_invalid_values: false
1031
+ repetition_penalty: 1
1032
+ return_dict: true
1033
+ return_dict_in_generate: false
1034
+ sep_token_id: null
1035
+ suppress_tokens: null
1036
+ task_specific_params: null
1037
+ temperature: 1
1038
+ text_config:
1039
+ _name_or_path: ""
1040
+ add_cross_attention: false
1041
+ architectures: null
1042
+ attention_bias: false
1043
+ attention_dropout: 0
1044
+ bad_words_ids: null
1045
+ begin_suppress_tokens: null
1046
+ bos_token_id: null
1047
+ chunk_size_feed_forward: 0
1048
+ cross_attention_hidden_size: null
1049
+ decoder_start_token_id: null
1050
+ diversity_penalty: 0
1051
+ do_sample: false
1052
+ dtype: null
1053
+ early_stopping: false
1054
+ encoder_no_repeat_ngram_size: 0
1055
+ eos_token_id: null
1056
+ exponential_decay_length_penalty: null
1057
+ finetuning_task: null
1058
+ forced_bos_token_id: null
1059
+ forced_eos_token_id: null
1060
+ head_dim: 128
1061
+ hidden_act: silu
1062
+ hidden_size: 2048
1063
+ id2label:
1064
+ "0": LABEL_0
1065
+ "1": LABEL_1
1066
+ initializer_range: 0.02
1067
+ intermediate_size: 6144
1068
+ is_decoder: false
1069
+ is_encoder_decoder: false
1070
+ label2id:
1071
+ LABEL_0: 0
1072
+ LABEL_1: 1
1073
+ length_penalty: 1
1074
+ max_length: 20
1075
+ max_position_embeddings: 65536
1076
+ min_length: 0
1077
+ model_type: qwen3_asr_text
1078
+ no_repeat_ngram_size: 0
1079
+ num_attention_heads: 16
1080
+ num_beam_groups: 1
1081
+ num_beams: 1
1082
+ num_hidden_layers: 28
1083
+ num_key_value_heads: 8
1084
+ num_return_sequences: 1
1085
+ output_attentions: false
1086
+ output_hidden_states: false
1087
+ output_scores: false
1088
+ pad_token_id: 151643
1089
+ prefix: null
1090
+ problem_type: null
1091
+ remove_invalid_values: false
1092
+ repetition_penalty: 1
1093
+ return_dict: true
1094
+ return_dict_in_generate: false
1095
+ rms_norm_eps: 1e-06
1096
+ rope_scaling:
1097
+ interleaved: true
1098
+ mrope_interleaved: true
1099
+ mrope_section:
1100
+ - 24
1101
+ - 20
1102
+ - 20
1103
+ rope_type: default
1104
+ type: default
1105
+ rope_theta: 1000000
1106
+ sep_token_id: null
1107
+ suppress_tokens: null
1108
+ task_specific_params: null
1109
+ temperature: 1
1110
+ tf_legacy_loss: false
1111
+ tie_encoder_decoder: false
1112
+ tie_word_embeddings: true
1113
+ tokenizer_class: null
1114
+ top_k: 50
1115
+ top_p: 1
1116
+ torchscript: false
1117
+ typical_p: 1
1118
+ use_bfloat16: false
1119
+ use_cache: false
1120
+ vocab_size: 151936
1121
+ tf_legacy_loss: false
1122
+ tie_encoder_decoder: false
1123
+ tie_word_embeddings: true
1124
+ tokenizer_class: null
1125
+ top_k: 50
1126
+ top_p: 1
1127
+ torchscript: false
1128
+ typical_p: 1
1129
+ use_bfloat16: false
1130
+ user_token_id: 872
1131
+ tie_encoder_decoder:
1132
+ value: false
1133
+ tie_word_embeddings:
1134
+ value: true
1135
+ tokenizer_class:
1136
+ value: null
1137
+ top_entropy_quantile:
1138
+ value: 1
1139
+ top_k:
1140
+ value: 50
1141
+ top_p:
1142
+ value: 0.95
1143
+ torch_compile:
1144
+ value: false
1145
+ torch_compile_backend:
1146
+ value: null
1147
+ torch_compile_mode:
1148
+ value: null
1149
+ torch_empty_cache_steps:
1150
+ value: null
1151
+ torchdynamo:
1152
+ value: null
1153
+ torchscript:
1154
+ value: false
1155
+ tpu_metrics_debug:
1156
+ value: false
1157
+ tpu_num_cores:
1158
+ value: null
1159
+ trackio_space_id:
1160
+ value: trackio
1161
+ train_dataloader_shuffle:
1162
+ value: true
1163
+ transformers_version:
1164
+ value: 4.57.6
1165
+ tuner_backend:
1166
+ value: peft
1167
+ tuner_type:
1168
+ value: lora
1169
+ typical_p:
1170
+ value: 1
1171
+ use_bfloat16:
1172
+ value: false
1173
+ use_bias_correction_kl:
1174
+ value: false
1175
+ use_cpu:
1176
+ value: false
1177
+ use_flash_ckpt:
1178
+ value: false
1179
+ use_galore:
1180
+ value: false
1181
+ use_legacy_prediction_loop:
1182
+ value: false
1183
+ use_liger_kernel:
1184
+ value: false
1185
+ use_logits_to_keep:
1186
+ value: null
1187
+ use_mps_device:
1188
+ value: false
1189
+ use_transformers_paged:
1190
+ value: false
1191
+ use_vllm:
1192
+ value: false
1193
+ vit_gradient_checkpointing:
1194
+ value: true
1195
+ vit_lr:
1196
+ value: null
1197
+ vllm_data_parallel_size:
1198
+ value: 1
1199
+ vllm_disable_cascade_attn:
1200
+ value: false
1201
+ vllm_disable_custom_all_reduce:
1202
+ value: true
1203
+ vllm_enable_expert_parallel:
1204
+ value: false
1205
+ vllm_enable_lora:
1206
+ value: false
1207
+ vllm_enable_prefix_caching:
1208
+ value: true
1209
+ vllm_enable_sleep_mode:
1210
+ value: false
1211
+ vllm_enforce_eager:
1212
+ value: false
1213
+ vllm_gpu_memory_utilization:
1214
+ value: 0.9
1215
+ vllm_group_port:
1216
+ value: 51216
1217
+ vllm_importance_sampling_cap:
1218
+ value: 3
1219
+ vllm_importance_sampling_correction:
1220
+ value: true
1221
+ vllm_importance_sampling_mode:
1222
+ value: sequence_mask
1223
+ vllm_limit_mm_per_prompt:
1224
+ value: null
1225
+ vllm_max_lora_rank:
1226
+ value: 16
1227
+ vllm_max_model_len:
1228
+ value: null
1229
+ vllm_max_model_length:
1230
+ value: null
1231
+ vllm_max_num_seqs:
1232
+ value: null
1233
+ vllm_mm_processor_cache_gb:
1234
+ value: null
1235
+ vllm_mode:
1236
+ value: null
1237
+ vllm_model_impl:
1238
+ value: vllm
1239
+ vllm_pipeline_parallel_size:
1240
+ value: 1
1241
+ vllm_quantization:
1242
+ value: null
1243
+ vllm_reasoning_parser:
1244
+ value: null
1245
+ vllm_server_base_url:
1246
+ value: null
1247
+ vllm_server_group_port:
1248
+ value: null
1249
+ vllm_server_host:
1250
+ value: null
1251
+ vllm_server_pass_dataset:
1252
+ value: false
1253
+ vllm_server_port:
1254
+ value:
1255
+ - 8000
1256
+ vllm_server_timeout:
1257
+ value: 240
1258
+ vllm_speculative_config:
1259
+ value: null
1260
+ vllm_structured_outputs_regex:
1261
+ value: null
1262
+ vllm_tensor_parallel_size:
1263
+ value: 1
1264
+ vllm_use_async_engine:
1265
+ value: null
1266
+ wandb_log_unique_prompts:
1267
+ value: null
1268
+ warmup_ratio:
1269
+ value: 0.03
1270
+ warmup_steps:
1271
+ value: 0
1272
+ weight_decay:
1273
+ value: 0.1
wandb/run-20260417_125349-3c0s7mq3/files/media/table/completions_1_1de95d5626025fdbb34e.table.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"columns": ["step", "prompt", "completion", "ASRWerSubLenCmpHalluDirtyV56", "advantages", "solution"], "data": [["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I had stood by him, whatever the others said.<|im_end|>", -0.18555980920791626, -0.256487101316452, "i'd ha stood by him whatever the others said"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I had stood by him, whatever the others said.<|im_end|>", -0.18555980920791626, -0.256487101316452, "i'd ha stood by him whatever the others said"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I had stood by him, whatever the others said.<|im_end|>", -0.18555980920791626, -0.256487101316452, "i'd ha stood by him whatever the others said"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I had stood by him, whatever the others said.<|im_end|>", -0.18555980920791626, -0.256487101316452, "i'd ha stood by him whatever the others said"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I had stood by him, whatever the others said.<|im_end|>", -0.18555980920791626, -0.256487101316452, "i'd ha stood by him whatever the others said"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I had stood by him, whatever the others said.<|im_end|>", -0.18555980920791626, -0.256487101316452, "i'd ha stood by him whatever the others said"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I had stood by him, whatever the others said.<|im_end|>", -0.18555980920791626, -0.256487101316452, "i'd ha stood by him whatever the 
others said"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I had stood by him, whatever the others said.<|im_end|>", -0.18555980920791626, -0.256487101316452, "i'd ha stood by him whatever the others said"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I had stood by him, whatever the others said.<|im_end|>", -0.18555980920791626, -0.256487101316452, "i'd ha stood by him whatever the others said"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I had stood by him, whatever the others said.<|im_end|>", -0.18555980920791626, -0.256487101316452, "i'd ha stood by him whatever the others said"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I has stood by him, whatever the others said.<|im_end|>", -0.18279924988746643, 2.8213913440704346, "i'd ha stood by him whatever the others said"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I had stood by him, whatever the others said.<|im_end|>", -0.18555980920791626, -0.256487101316452, "i'd ha stood by him whatever the others said"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The reverend rectumist passed his hand wearily over his brow a hill with a faint noise of running up stairs somewhere we never touched the beastly box, said he then your competitors did said missus naylor no no said the curate hastily<|im_end|>", -0.2760888338088989, -0.9180124998092651, "The reverend septimus passed his hand wearily over his brow. I feel a little faint, he said, running upstairs so quickly, we never touched the beastly box, said robert. Then your confederates did said miss selina. 
No, no, said the curate hastily."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The reverend recteur passed his hand wearily over his brow a hill with a faint memory of running upstairs so quickly, we never touched the beastly box said he then your competitor is dead said missus nisbet no, no said the curate hastily.<|im_end|>", -0.09747578948736191, 0.25090181827545166, "The reverend septimus passed his hand wearily over his brow. I feel a little faint, he said, running upstairs so quickly, we never touched the beastly box, said robert. Then your confederates did said miss selina. No, no, said the curate hastily."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The reverend recteur passed his hand wearily over his brow a hill with a fainting spell in it upstairs, he said. We never touched the beastly box before and your competitor did, said missus nina no, no, said the curate hastily.<|im_end|>", -0.4100283682346344, -1.7945656776428223, "The reverend septimus passed his hand wearily over his brow. I feel a little faint, he said, running upstairs so quickly, we never touched the beastly box, said robert. Then your confederates did said miss selina. No, no, said the curate hastily."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The reverend rectory passed his hand wearily over his brow. I feel a little faint, Missus Allen, upstairs said vicar. We never touched the beastly box, did we? Then your competitor is dead, said missus allen no no said the curate hastily.<|im_end|>", 0.06087213382124901, 1.2871931791305542, "The reverend septimus passed his hand wearily over his brow. I feel a little faint, he said, running upstairs so quickly, we never touched the beastly box, said robert. Then your confederates did said miss selina. 
No, no, said the curate hastily."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The reverend recteur passed his hand wearily over his brow a hillwood of faintness and running upstairs so quickly we never touched the beastly box said the vicar then your competitor did said missus nelly no, no said the curate hastily<|im_end|>", -0.06288440525531769, 0.47728151082992554, "The reverend septimus passed his hand wearily over his brow. I feel a little faint, he said, running upstairs so quickly, we never touched the beastly box, said robert. Then your confederates did said miss selina. No, no, said the curate hastily."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The reverend recteur passed his hand wearily over his brow a hill of saint nicholas went upstairs so quickly we never touched the beastly box then your competitor did said missus nixon no, no, said the curate hastily.<|im_end|>", 0.01360579114407301, 0.9778635501861572, "The reverend septimus passed his hand wearily over his brow. I feel a little faint, he said, running upstairs so quickly, we never touched the beastly box, said robert. Then your confederates did said miss selina. No, no, said the curate hastily."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The reverend rectumist passed his hand wearily over his brow a still little faintness had been running up stairs since dinner. We never touched the beastly box, said he and your competitor did, said missus anna no, no, said the curate hastily.<|im_end|>", -0.15452256798744202, -0.1224348247051239, "The reverend septimus passed his hand wearily over his brow. I feel a little faint, he said, running upstairs so quickly, we never touched the beastly box, said robert. Then your confederates did said miss selina. 
No, no, said the curate hastily."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The reverend recteur passed his hand wearily over his brow, a hill with a faint memory of running upstairs so quickly. We never touched the beastly box before. Then your competitor did said missus nixon no no said the curate hastily.<|im_end|>", -0.17706401646137238, -0.26995497941970825, "The reverend septimus passed his hand wearily over his brow. I feel a little faint, he said, running upstairs so quickly, we never touched the beastly box, said robert. Then your confederates did said miss selina. No, no, said the curate hastily."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The reverend rectumist passed his hand wearily over his brow a hillwood of faintness and running upstairs so quickly, we never touched the beastly box. Then your competitor did said missus nixon no no said the curate hastily.<|im_end|>", 0.016543198376893997, 0.9970871210098267, "The reverend septimus passed his hand wearily over his brow. I feel a little faint, he said, running upstairs so quickly, we never touched the beastly box, said robert. Then your confederates did said miss selina. No, no, said the curate hastily."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The reverend rectors passed his hand wearily over his brow, a hill with a faint memory of running upstairs so quickly. We never touched the beastly box. Then your competitor did said missus neale no no said the curate hastily.<|im_end|>", -0.1560557782649994, -0.13246876001358032, "The reverend septimus passed his hand wearily over his brow. I feel a little faint, he said, running upstairs so quickly, we never touched the beastly box, said robert. Then your confederates did said miss selina. 
No, no, said the curate hastily."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The reverend recteur passed his hand wearily over his brow a hill with a faint moonlight running upstairs so quickly, we never touched the beastly box said he then you're a competitor, it seems said missus nixon no no said the curate hastily<|im_end|>", -0.36874449253082275, -1.5243877172470093, "The reverend septimus passed his hand wearily over his brow. I feel a little faint, he said, running upstairs so quickly, we never touched the beastly box, said robert. Then your confederates did said miss selina. No, no, said the curate hastily."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The reverend recteur passed his hand wearily over his brow, I feel a little faint now that I am upstairs so quickly. We never touched the vesuvio, said the doctor. Then your competitors did, said missus nina. No, no, said the curate hastily.<|im_end|>", -0.01792760007083416, 0.771496593952179, "The reverend septimus passed his hand wearily over his brow. I feel a little faint, he said, running upstairs so quickly, we never touched the beastly box, said robert. Then your confederates did said miss selina. No, no, said the curate hastily."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>There was much armaghajt in my cousin's sister, the political aspect of the revolution is fenced changing almost every day she might not understand how his own views and sympathies might often modify her.<|im_end|>", -0.025386638939380646, -1.575260877609253, "There was much armand saint just could not tell his sister the political aspect of the revolution in france was changing almost every day. 
She might not understand how his own views and sympathies might become modified."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>There was much armagnac julec in my parent's estate, the political aspect of the revolution since changing almost every day she might not understand how his own views and sympathies might often modify them.<|im_end|>", -0.03027840331196785, -1.6189521551132202, "There was much armand saint just could not tell his sister the political aspect of the revolution in france was changing almost every day. She might not understand how his own views and sympathies might become modified."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>There was much armagnac jokes with my cousins and sister, the political aspect of the revolution in france changing almost every day she might not understand how his own views and sympathies might differ from mine.<|im_end|>", 0.10477012395858765, -0.41274797916412354, "There was much armand saint just could not tell his sister the political aspect of the revolution in france was changing almost every day. She might not understand how his own views and sympathies might become modified."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>There was much armagnac joke for my cousin sister, the political aspect of the revolution in france changing almost every day she might not understand how his own views and sympathies might often modify those.<|im_end|>", 0.11768282204866409, -0.29741644859313965, "There was much armand saint just could not tell his sister the political aspect of the revolution in france was changing almost every day. 
She might not understand how his own views and sympathies might become modified."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>There was much armagnac joke from my cousin sister, the political aspect of the revolution in france changing almost every day she might not understand how his own views and sympathies might be modified.<|im_end|>", 0.2628527879714966, 0.9991887807846069, "There was much armand saint just could not tell his sister the political aspect of the revolution in france was changing almost every day. She might not understand how his own views and sympathies might become modified."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>There was much armageddus in my present system. The political aspect of the revolution is hence changing almost every day. She might not understand how his own views and sympathies might often modify mine.<|im_end|>", 0.05142616108059883, -0.8891968727111816, "There was much armand saint just could not tell his sister the political aspect of the revolution in france was changing almost every day. She might not understand how his own views and sympathies might become modified."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>There was much armagnac, jute and matelot in his tea. The political aspect of the revolution is hence changing almost every day. She might not understand how his own views and sympathies might have been modified.<|im_end|>", 0.18227215111255646, 0.27947190403938293, "There was much armand saint just could not tell his sister the political aspect of the revolution in france was changing almost every day. 
She might not understand how his own views and sympathies might become modified."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>There was much armagnac, jute for my companion sister. The political aspect of the revolution in france changing almost every day. She might not understand how his own views and sympathies might often modify.<|im_end|>", 0.257134348154068, 0.9481137990951538, "There was much armand saint just could not tell his sister the political aspect of the revolution in france was changing almost every day. She might not understand how his own views and sympathies might become modified."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>There was much armagnac yoke to my cousin's sister, the political aspect of the revolution in france changing almost every day she might not understand how his own views and sympathies might differ from mine.<|im_end|>", 0.11708571761846542, -0.3027495741844177, "There was much armand saint just could not tell his sister the political aspect of the revolution in france was changing almost every day. She might not understand how his own views and sympathies might become modified."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>There was much armagnac joke to my cousin's sister, the political aspect of the revolution in france changing almost every day she might not understand how his own views and sympathies might be modified.<|im_end|>", 0.2641826272010803, 1.0110664367675781, "There was much armand saint just could not tell his sister the political aspect of the revolution in france was changing almost every day. 
She might not understand how his own views and sympathies might become modified."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>There was much armagnac joke with my cousins sister, the political aspect of the revolution in france changing almost every day she might not understand how his own views and sympathies might be modified.<|im_end|>", 0.26373809576034546, 1.0070960521697998, "There was much armand saint just could not tell his sister the political aspect of the revolution in france was changing almost every day. She might not understand how his own views and sympathies might become modified."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>There was much armagnac yet for my traveling sister. The political aspect of the revolution in france is changing almost every day. She might not understand how her own views and sympathies might be modified.<|im_end|>", 0.24630455672740936, 0.8513860106468201, "There was much armand saint just could not tell his sister the political aspect of the revolution in france was changing almost every day. 
She might not understand how his own views and sympathies might become modified."], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Never, private or public, that the order should be payable in India and to bear an interest of five per cent if these orders were supposed to be vicious by reason of being purchased he secondly with very little hesitation adopted both orders were immediately printed.<|im_end|>", -0.3420386016368866, -0.659913957118988, "and therefore i propos'd that the orders should be payable in a year and to bear an interest of five per cent with these orders i suppos'd the provisions might easily be purchas'd the assembly with very little hesitation adopted the proposal the orders were immediately printed"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Never, rather opposed that the order should be payable in India and do bear an interest of five per cent if these orders were disposed of provisions might easily be purchased he seconded with very little hesitation adopted both orders were immediately printed.<|im_end|>", -0.032027214765548706, 1.195294737815857, "and therefore i propos'd that the orders should be payable in a year and to bear an interest of five per cent with these orders i suppos'd the provisions might easily be purchas'd the assembly with very little hesitation adopted the proposal the orders were immediately printed"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Never, either of both that they ordered it should be payable in a year and do bear an interest of five per cent if these orders were disposed of provisions might easily be purchased he said with very little hesitation adopted by both orders were immediately printed.<|im_end|>", -0.04057157412171364, 1.1441625356674194, "and therefore i propos'd 
that the orders should be payable in a year and to bear an interest of five per cent with these orders i suppos'd the provisions might easily be purchas'd the assembly with very little hesitation adopted the proposal the orders were immediately printed"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Never prior to public opinion that the order should be payable in any and do bearing interest of five per cent if these orders were supposed provisionists might easily be purchased this enactment with very little hesitation adopted by both voters were immediately printed.<|im_end|>", -0.3433881402015686, -0.6679900288581848, "and therefore i propos'd that the orders should be payable in a year and to bear an interest of five per cent with these orders i suppos'd the provisions might easily be purchas'd the assembly with very little hesitation adopted the proposal the orders were immediately printed"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Never, prior to the public that they ordered it should be payable in a year and do bear an interest of five per cent if these orders were disposed of provisionally at least would be purchased he said with very little hesitation adopted both orders were immediately printed.<|im_end|>", -0.33630597591400146, -0.6256080865859985, "and therefore i propos'd that the orders should be payable in a year and to bear an interest of five per cent with these orders i suppos'd the provisions might easily be purchas'd the assembly with very little hesitation adopted the proposal the orders were immediately printed"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Never prior to publication that the order should be payable in any year and do bear an interest of five per cent if these orders were disposed of 
provisionally at least could be purchased he said with very little hesitation adopted both orders were immediately printed<|im_end|>", -0.1676534116268158, 0.3836635649204254, "and therefore i propos'd that the orders should be payable in a year and to bear an interest of five per cent with these orders i suppos'd the provisions might easily be purchas'd the assembly with very little hesitation adopted the proposal the orders were immediately printed"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Never prior to public opinion that they ordered it should be payable in India and do bear an interest of five per cent if these orders were supposed provision is likely soon to be purchased this act with very little hesitation adopted by both voters were immediately printed.<|im_end|>", -0.5411341190338135, -1.8513660430908203, "and therefore i propos'd that the orders should be payable in a year and to bear an interest of five per cent with these orders i suppos'd the provisions might easily be purchas'd the assembly with very little hesitation adopted the proposal the orders were immediately printed"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Never prior to public debate that the order should be payable in England and do bear an interest of five per cent if these orders were to suppose the provisions might easily be purchased he seconded with very little hesitation adopted both orders were immediately printed.<|im_end|>", -0.07721911370754242, 0.9248517155647278, "and therefore i propos'd that the orders should be payable in a year and to bear an interest of five per cent with these orders i suppos'd the provisions might easily be purchas'd the assembly with very little hesitation adopted the proposal the orders were immediately printed"], ["1", 
"<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Never, prior to publication that they ordered it should be payable in a year and do bear an interest of five per cent if these orders were disposed of provisionally at least would be purchased is now with very little hesitation adopted both orders were immediately printed<|im_end|>", -0.22012776136398315, 0.06964004039764404, "and therefore i propos'd that the orders should be payable in a year and to bear an interest of five per cent with these orders i suppos'd the provisions might easily be purchas'd the assembly with very little hesitation adopted the proposal the orders were immediately printed"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Never prior to published that the order should be payable in a year and do bear an interest of five per cent, if these orders were disposed of provisionally at least would be purchased he seconded with very little hesitation adopted both orders were immediately printed<|im_end|>", -0.16621676087379456, 0.39226093888282776, "and therefore i propos'd that the orders should be payable in a year and to bear an interest of five per cent with these orders i suppos'd the provisions might easily be purchas'd the assembly with very little hesitation adopted the proposal the orders were immediately printed"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Never, cried her beloved, that the order should be payable in England and do bear interest at five per cent if these orders were disposed of provisionally at least would they purchase he said with very little hesitation adopted them both the orders were immediately printed.<|im_end|>", -0.4380200207233429, -1.2342978715896606, "and therefore i propos'd that the orders should be payable in a year and to bear an interest 
of five per cent with these orders i suppos'd the provisions might easily be purchas'd the assembly with very little hesitation adopted the proposal the orders were immediately printed"], ["1", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Never prior to public debate that they ordered it should be payable in a year and to bear an interest of five per cent if these orders were supposed provisionists might easily be purchased he seconded with very little hesitation adopted both orders were immediately printed.<|im_end|>", -0.07647529989480972, 0.9293028712272644, "and therefore i propos'd that the orders should be payable in a year and to bear an interest of five per cent with these orders i suppos'd the provisions might easily be purchas'd the assembly with very little hesitation adopted the proposal the orders were immediately printed"]]}
wandb/run-20260417_125349-3c0s7mq3/files/media/table/completions_3_b8120af2e2a4bc038eb5.table.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"columns": ["step", "prompt", "completion", "ASRWerSubLenCmpHalluDirtyV56", "advantages", "solution"], "data": [["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Coordinating and shifting, collectively said he sheu, divided with each other in forming new combinations. We must remember however that the flower worship of the tibetans was formed from only a part of their ascetic ritual and it was not a distinct religion by itself.<|im_end|>", 0.06746125966310501, 0.25112149119377136, "kobori enshiu katagiri sekishiu vied with each other in forming new combinations we must remember however that the flower worship of the tea masters formed only a part of their aesthetic ritual and was not a distinct religion by itself"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Kohori and shi no katanu ni seki shi no vied with each other in forming new combinations. We must remember, however, that the flower worship of the tea masters formed only a part of their ascetic ritual, and it was not a distinct religion by itself.<|im_end|>", 0.008763517253100872, -0.30829519033432007, "kobori enshiu katagiri sekishiu vied with each other in forming new combinations we must remember however that the flower worship of the tea masters formed only a part of their aesthetic ritual and was not a distinct religion by itself"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Coordinating and shifting, collectively setting shift, fighting with each other in forming new combinations. 
We must remember, however, that the flower worship of the teengas performed only a part of their respective ritual, and was not a distinct religion by itself.<|im_end|>", -0.017216404899954796, -0.5558958649635315, "kobori enshiu katagiri sekishiu vied with each other in forming new combinations we must remember however that the flower worship of the tea masters formed only a part of their aesthetic ritual and was not a distinct religion by itself"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Coordinating and shifting, collectively said he she would divide with each other in forming new combinations we must remember however that the flower worship of the tibetans was formed from only a part of their ascetic ritual and it was not a distinct religion by itself<|im_end|>", 0.13382616639137268, 0.8836097717285156, "kobori enshiu katagiri sekishiu vied with each other in forming new combinations we must remember however that the flower worship of the tea masters formed only a part of their aesthetic ritual and was not a distinct religion by itself"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Coordinating shibumi, kafanguiyaseki shibumi, fight with each other in forming new combinations. 
We must remember, however, that the flower worship of the teikos was formed from only a part of their ascetic ritual and it was not a distinct religion by itself.<|im_end|>", 0.12175671756267548, 0.7685823440551758, "kobori enshiu katagiri sekishiu vied with each other in forming new combinations we must remember however that the flower worship of the tea masters formed only a part of their aesthetic ritual and was not a distinct religion by itself"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Coordinating and shifting, collectively city shifted, fighting with each other in forming new combinations. We must remember, however, that the flower worship of the teentots performed only a part of their ascetic ritual, and it was not a distinct religion by itself.<|im_end|>", -0.07603159546852112, -1.1164319515228271, "kobori enshiu katagiri sekishiu vied with each other in forming new combinations we must remember however that the flower worship of the tea masters formed only a part of their aesthetic ritual and was not a distinct religion by itself"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Coordinating shiwoo, collectively said yishii, vied with each other in forming new combinations. 
We must remember however that the flower worship of the teegas was but only a part of their ascetic ritual, and it was not a distinct religion by itself.<|im_end|>", 0.18717117607593536, 1.3920124769210815, "kobori enshiu katagiri sekishiu vied with each other in forming new combinations we must remember however that the flower worship of the tea masters formed only a part of their aesthetic ritual and was not a distinct religion by itself"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Coordinating and shifting, coupling these subunits, varied with each other in forming new combinations. We must remember, however, that the flower worship of the teentas performed only a part of their ascetic ritual, and it was not a distinct religion by itself.<|im_end|>", -0.07198049873113632, -1.0778230428695679, "kobori enshiu katagiri sekishiu vied with each other in forming new combinations we must remember however that the flower worship of the tea masters formed only a part of their aesthetic ritual and was not a distinct religion by itself"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Coordinating and shu, ka te nuisi se ki shu fight with each other in forming new combinations we must remember however that the flower worship of the tinus performed only a part of their ascetic ritual and was not a distinct religion by itself.<|im_end|>", 0.0946241021156311, 0.5099959969520569, "kobori enshiu katagiri sekishiu vied with each other in forming new combinations we must remember however that the flower worship of the tea masters formed only a part of their aesthetic ritual and was not a distinct religion by itself"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Kohori and shiromu kafanuri, sakiishi, vied with each other in forming new combinations. 
We must remember however that the flower worship of the teiyas was but only a part of their ascetic ritual, and it was not a distinct religion by itself.<|im_end|>", 0.193635493516922, 1.453620433807373, "kobori enshiu katagiri sekishiu vied with each other in forming new combinations we must remember however that the flower worship of the tea masters formed only a part of their aesthetic ritual and was not a distinct religion by itself"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Coordinating and shifting, collectively setting shift, fighting with each other in forming new combinations. We must remember, however, that the flower worship of the teentas performed only a part of their ascetic ritual, and it was not a distinct religion by itself.<|im_end|>", -0.0758325457572937, -1.1145349740982056, "kobori enshiu katagiri sekishiu vied with each other in forming new combinations we must remember however that the flower worship of the tea masters formed only a part of their aesthetic ritual and was not a distinct religion by itself"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Cohorti and instituti, capellanus et institutus, fight with each other in forming new combinations. 
We must remember, however, that the flower worship of the tegots was formed from only a part of their ascetic ritual, and it was not a distinct religion by itself.<|im_end|>", -0.07283444702625275, -1.0859616994857788, "kobori enshiu katagiri sekishiu vied with each other in forming new combinations we must remember however that the flower worship of the tea masters formed only a part of their aesthetic ritual and was not a distinct religion by itself"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>With red hot boulders lying about everywhere, d'you think it went off well? Creedle he asked her. The victuals did that I know and the drink did that I set fast in believe upon a sound of barrels good honest drink.<|im_end|>", 0.16612012684345245, -0.016373056918382645, "with red hot bowlders lying about everywhere do you think it went off well creedle he asked the victuals did that i know and the drink did that i steadfastly believe from the holler sound of the barrels good honest drink"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>With red hot boulders lying about everywhere, d'you think it went off well? Creedele he asked me. The victuals did that I know and the drink did that I set fasty believe upon a sound of barrels good honest drink.<|im_end|>", 0.15556275844573975, -0.08780591189861298, "with red hot bowlders lying about everywhere do you think it went off well creedle he asked the victuals did that i know and the drink did that i steadfastly believe from the holler sound of the barrels good honest drink"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>With red hot bolters flying about everywhere, do you think it went off well creedle? 
He asked me the victuals did that I know and the drink did that I set fast to believe upon a sound of barrels good honest strength.<|im_end|>", 0.2218746393918991, 0.36087095737457275, "with red hot bowlders lying about everywhere do you think it went off well creedle he asked the victuals did that i know and the drink did that i steadfastly believe from the holler sound of the barrels good honest drink"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>With red hot boulders lying about everywhere, do you think it went off well? Creedle he asked her. The victuals did that I know and the drink did that I steadfastly believe upon a chance of barrels good honest drink.<|im_end|>", 0.42252233624458313, 1.7184855937957764, "with red hot bowlders lying about everywhere do you think it went off well creedle he asked the victuals did that i know and the drink did that i steadfastly believe from the holler sound of the barrels good honest drink"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>With red hot boulders flying about everywhere, do you think it went off well? Creel he asked. The victuals did that I know and the drink did that I set fasty believe upon a shanty barrels good honest strength.<|im_end|>", 0.07005643844604492, -0.6663554310798645, "with red hot bowlders lying about everywhere do you think it went off well creedle he asked the victuals did that i know and the drink did that i steadfastly believe from the holler sound of the barrels good honest drink"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>With red hot bolters flying about everywhere, do you think it went off well? Creedle he asked her. 
The victuals did that I know and the drink did that I set fast to believe upon a challenge of barrels good honest strength.<|im_end|>", 0.1369437873363495, -0.21378487348556519, "with red hot bowlders lying about everywhere do you think it went off well creedle he asked the victuals did that i know and the drink did that i steadfastly believe from the holler sound of the barrels good honest drink"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>With red hot boulders flying about everywhere, do you think it went off well? Creel he asked the victors did that I know and the drink did that I steadfastly believe upon a sound of barrels good honest drink.<|im_end|>", 0.3446210026741028, 1.1913926601409912, "with red hot bowlders lying about everywhere do you think it went off well creedle he asked the victuals did that i know and the drink did that i steadfastly believe from the holler sound of the barrels good honest drink"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>With red hot boulders flying about everywhere, do you think it went off well? Creedele he asked her, the victuals did that I know and the drink did that I steadfastly believe upon a sound of barrels good honest drink.<|im_end|>", 0.3581290543079376, 1.2827903032302856, "with red hot bowlders lying about everywhere do you think it went off well creedle he asked the victuals did that i know and the drink did that i steadfastly believe from the holler sound of the barrels good honest drink"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>With red hot boulders flying about everywhere, do you think it went off well? Creel he asked. 
The victuals did that I know, and the drink did that I said pass'd me believe upon a trial in barrels good honest drink.<|im_end|>", -0.024973222985863686, -1.309341549873352, "with red hot bowlders lying about everywhere do you think it went off well creedle he asked the victuals did that i know and the drink did that i steadfastly believe from the holler sound of the barrels good honest drink"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>With red hot bolters flying about everywhere, d'you think it went off well? Creel he asked her. The victuals did that I know, and the drink did. That I set fasty believe upon a sound of barrels good honest strength.<|im_end|>", -0.054762814193964005, -1.5109026432037354, "with red hot bowlders lying about everywhere do you think it went off well creedle he asked the victuals did that i know and the drink did that i steadfastly believe from the holler sound of the barrels good honest drink"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>With red hot boulders lying about everywhere, do you think it went off well? Creel he asked her the victuals did that I know and the drink did that I set fast to believe upon a chance of barrels good honest drink.<|im_end|>", 0.1390748769044876, -0.19936557114124298, "with red hot bowlders lying about everywhere do you think it went off well creedle he asked the victuals did that i know and the drink did that i steadfastly believe from the holler sound of the barrels good honest drink"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>With red hot boulders lying about everywhere, d'you think it went off well, creedle? He asked. 
The victuals did that I know and the drink did that I said must be believed upon a sound of barrels good honest drink.<|im_end|>", 0.08731066435575485, -0.5496105551719666, "with red hot bowlders lying about everywhere do you think it went off well creedle he asked the victuals did that i know and the drink did that i steadfastly believe from the holler sound of the barrels good honest drink"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For it is wonderful how many things may be acquired by some means a writer was once employed in which of course he got continual friends and you pick up mary hansen gilding on the colonies of abies, which seems answer to your friend's wants.<|im_end|>", -0.8597428202629089, -1.7000007629394531, "For it is wonderful how soon these are acquired by some horses. The writer was once employed to purchase a horse for a country friend. And he picked a very handsome gelding out of collins's stables, which seemed to answer to his friend's wants."], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For it is wonderful how a name can be acquired by some means the writer was once employed in preaching a course of instruction to friends and repeated very handsome gilding on the columns of statues which seemed to answer to his friend's wants.<|im_end|>", -0.28019994497299194, 0.7384878396987915, "For it is wonderful how soon these are acquired by some horses. The writer was once employed to purchase a horse for a country friend. 
And he picked a very handsome gelding out of collins's stables, which seemed to answer to his friend's wants."], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For it is wonderful how men can be inspired by some things a writer was once employed in preaching a course of lectures to his friends, and he picked up very handsome gelding on the colony's estate which seems answer to the prince's wants.<|im_end|>", -0.4687815308570862, -0.05498935654759407, "For it is wonderful how soon these are acquired by some horses. The writer was once employed to purchase a horse for a country friend. And he picked a very handsome gelding out of collins's stables, which seemed to answer to his friend's wants."], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For it is wonderful how names may be acquired by some means. The writer was once employed in preaching before a group of young friends, and repeated his merry fencing gelping on the colonies of babies which seems answer to the friend's wants.<|im_end|>", -0.6376533508300781, -0.7655355930328369, "For it is wonderful how soon these are acquired by some horses. The writer was once employed to purchase a horse for a country friend. And he picked a very handsome gelding out of collins's stables, which seemed to answer to his friend's wants."], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For it is wonderful how many things may be acquired by some means. The writer was once employed in purchase of horses from his friends, and repeated a very handsome gelding on the colony's table, which seemed to answer to his friend's wants.<|im_end|>", -0.07159067690372467, 1.6162337064743042, "For it is wonderful how soon these are acquired by some horses. 
The writer was once employed to purchase a horse for a country friend. And he picked a very handsome gelding out of collins's stables, which seemed to answer to his friend's wants."], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For it is wonderful how names can be acquired by some means a writer was once employed in teaching a boy about his own friends, and he picked up very handsome gelding on the colony of cape town which seemed to answer just what he wanted.<|im_end|>", -0.39772796630859375, 0.24397611618041992, "For it is wonderful how soon these are acquired by some horses. The writer was once employed to purchase a horse for a country friend. And he picked a very handsome gelding out of collins's stables, which seemed to answer to his friend's wants."], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For it is wonderful how many things are required by some people. The writer was once employed in teaching a course of lectures to his friends, and he picked up very handsome gelding on the colonies of bays which seemed to answer just at his wants.<|im_end|>", -0.31977492570877075, 0.5719718337059021, "For it is wonderful how soon these are acquired by some horses. The writer was once employed to purchase a horse for a country friend. And he picked a very handsome gelding out of collins's stables, which seemed to answer to his friend's wants."], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For it is wonderful how a name can be acquired by some means. 
The writer was once employed in purchase of horses for his friends, and he picked up very handsome geldings on the colonies of scotland, which seems answer to his friend's wants.<|im_end|>", -0.23753882944583893, 0.9179890155792236, "For it is wonderful how soon these are acquired by some horses. The writer was once employed to purchase a horse for a country friend. And he picked a very handsome gelding out of collins's stables, which seemed to answer to his friend's wants."], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For it is wonderful how a name can be acquired by some means. The writer was once employed in preaching before a congregation of friends, and repeated very handsome gilding on the columns of tables, which seemed to answer to his friend's wants.<|im_end|>", -0.33328479528427124, 0.5151276588439941, "For it is wonderful how soon these are acquired by some horses. The writer was once employed to purchase a horse for a country friend. And he picked a very handsome gelding out of collins's stables, which seemed to answer to his friend's wants."], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For it is wonderful how many names are supplied by some mistake. The writer was once employed in teaching a course of instruction to friends, and repeated Mary Hanson gilding on the colonies of babies, which seems answer to his friend's wants.<|im_end|>", -0.3981190025806427, 0.24233078956604004, "For it is wonderful how soon these are acquired by some horses. The writer was once employed to purchase a horse for a country friend. 
And he picked a very handsome gelding out of collins's stables, which seemed to answer to his friend's wants."], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For it is wonderful how many things can be acquired by some means a writer was once employed in which of course he rubbed his teeth with frank and repeated mary hansen gelling on the colonies of georgia, which seems answer to the friend's wants.<|im_end|>", -0.7842603921890259, -1.382400393486023, "For it is wonderful how soon these are acquired by some horses. The writer was once employed to purchase a horse for a country friend. And he picked a very handsome gelding out of collins's stables, which seemed to answer to his friend's wants."], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>For it is wonderful how names can be acquired by some mistake. The writer was once employed in teaching a course of natural history at prague, and he pictures mary henshaw gellman on the colony of scotland, which seems answerable to frank's wants.<|im_end|>", -0.6798756718635559, -0.9431905150413513, "For it is wonderful how soon these are acquired by some horses. The writer was once employed to purchase a horse for a country friend. 
And he picked a very handsome gelding out of collins's stables, which seemed to answer to his friend's wants."], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>A week after the battle, my brother replied there from the capital of my expedition to make a horrible discovery that followed the eating up of the bodies of our dead heroes at two doors.<|im_end|>", -0.40796396136283875, -0.19726812839508057, "a week after the battle my brother rode by there on a cavalry expedition and made the horrible discovery that hogs were eating up the bodies of our dead heroes that too was war"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>A week after the battle, my brother was obliged to enter the capital of my expedition to make a horrible supper at the hall meeting of the bodies of our dead heroes. That too was for it.<|im_end|>", -0.6910028457641602, -0.9820257425308228, "a week after the battle my brother rode by there on a cavalry expedition and made the horrible discovery that hogs were eating up the bodies of our dead heroes that too was war"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>A week after the battle, my brother provided her with a capital expedition to make a horrible slaughter at home in eating up the bodies of our dead heroes that too was abortive.<|im_end|>", -0.0851043164730072, 0.6978971362113953, "a week after the battle my brother rode by there on a cavalry expedition and made the horrible discovery that hogs were eating up the bodies of our dead heroes that too was war"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>A week after the battle, my brother replied there from the capital of my expedition, in a horrible and stunned, I called at the meeting of 
the bodies of our dead heroes. That too was a word.<|im_end|>", -0.781724214553833, -1.2335611581802368, "a week after the battle my brother rode by there on a cavalry expedition and made the horrible discovery that hogs were eating up the bodies of our dead heroes that too was war"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>A week after the battle, my brother replied there from a capital in my position with a horrible discovery that he had fallen in eating up the bodies of our dead heroes. That too was a word.<|im_end|>", -0.2709154784679413, 0.18271444737911224, "a week after the battle my brother rode by there on a cavalry expedition and made the horrible discovery that hogs were eating up the bodies of our dead heroes that too was war"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>A week after the battle, my brother rode by there on a cavalry expedition to make a horrible supper at a hall meeting of the bodies of our dead heroes. That too was thwarted.<|im_end|>", 0.09377644956111908, 1.1938644647598267, "a week after the battle my brother rode by there on a cavalry expedition and made the horrible discovery that hogs were eating up the bodies of our dead heroes that too was war"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>A week after the battle, my brother and I were hired by a cavalry expedition to make a horrible study of the fall and eating up of the bodies of our dead heroes. 
That too was worth it.<|im_end|>", -0.39144468307495117, -0.15146653354167938, "a week after the battle my brother rode by there on a cavalry expedition and made the horrible discovery that hogs were eating up the bodies of our dead heroes that too was war"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>A week after the battle, my brother stood by her in a cabin at my expedition and made the horrible discovery that Paul was eating up the body of our dead hero. That too was a word.<|im_end|>", 0.046062320470809937, 1.0615715980529785, "a week after the battle my brother rode by there on a cavalry expedition and made the horrible discovery that hogs were eating up the bodies of our dead heroes that too was war"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>A week after the battle, my brother replied there on the capital of my expedition in a most horrible and shocking manner, that he had been the eating up the body of our dead hero. 
That was true as words.<|im_end|>", -0.8374046683311462, -1.3879414796829224, "a week after the battle my brother rode by there on a cavalry expedition and made the horrible discovery that hogs were eating up the bodies of our dead heroes that too was war"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>A week after the battle, my brother replied there in a capital condition, but made the horrible discovery that all were eating up the bodies of our dead heroes at two this morning.<|im_end|>", 0.09645416587591171, 1.2012887001037598, "a week after the battle my brother rode by there on a cavalry expedition and made the horrible discovery that hogs were eating up the bodies of our dead heroes that too was war"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>A week after the battle, my brother replied there in a capital condition, but in the horrible stumps that followed eating up the bodies of our dead heroes. That too was worth it.<|im_end|>", -0.051983222365379333, 0.7897290587425232, "a week after the battle my brother rode by there on a cavalry expedition and made the horrible discovery that hogs were eating up the bodies of our dead heroes that too was war"], ["5", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>A week after the battle, my brother replied there from the capital of my expedition, in a most horrible and startling letter that called on me to eat up the bodies of our dead heroes. That too was ordered.<|im_end|>", -0.7605313062667847, -1.1748013496398926, "a week after the battle my brother rode by there on a cavalry expedition and made the horrible discovery that hogs were eating up the bodies of our dead heroes that too was war"]]}
wandb/run-20260417_125349-3c0s7mq3/files/media/table/completions_5_510c5f07b145276e4210.table.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"columns": ["step", "prompt", "completion", "ASRWerSubLenCmpHalluDirtyV56", "advantages", "solution"], "data": [["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Instead of listening to you, I tell you that from this day forward, I will give that great man a pension of a thousand pieces of gold per month for his life. Nay, though I were to share with him all my riches and provisions.<|im_end|>", 0.7468931674957275, -0.5118773579597473, "instead of listening to you i tell you that from this day forward i will give that great man a pension of a thousand pieces of gold per month for his life nay though i were to share with him all my riches and dominions"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Instead of listening to you, I tell you that from this day forward, I will give that great man a pension of a thousand pieces of gold per month for his life. Nay, though I were to share with him all my riches and dominions.<|im_end|>", 0.7513310313224792, -0.21503543853759766, "instead of listening to you i tell you that from this day forward i will give that great man a pension of a thousand pieces of gold per month for his life nay though i were to share with him all my riches and dominions"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Instead of listening to you, I tell you that from this day forward, I will give that great man a pension of a thousand pieces of gold per month for his life. 
Nay, though I were to share with him all my riches and dominions.<|im_end|>", 0.7513310313224792, -0.21503543853759766, "instead of listening to you i tell you that from this day forward i will give that great man a pension of a thousand pieces of gold per month for his life nay though i were to share with him all my riches and dominions"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Instead of listening to you, I tell you that from this day forward, I will give that great man a pension of a thousand pieces of gold per month for his life. Nay, though I were to share with him all my riches and dominions.<|im_end|>", 0.7513310313224792, -0.21503543853759766, "instead of listening to you i tell you that from this day forward i will give that great man a pension of a thousand pieces of gold per month for his life nay though i were to share with him all my riches and dominions"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Instead of listening to you, I tell you that from this day forward, I will give that great man a pension of a thousand pieces of gold per month for his life. Nay, though I were to share with him all my riches and dominions.<|im_end|>", 0.7513310313224792, -0.21503543853759766, "instead of listening to you i tell you that from this day forward i will give that great man a pension of a thousand pieces of gold per month for his life nay though i were to share with him all my riches and dominions"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Instead of listening to you, I tell you that from this day forward, I will give that great man a pension of a thousand pieces of gold per month for his life. 
Nay, though I were to share with him all my riches and dominions.<|im_end|>", 0.7513310313224792, -0.21503543853759766, "instead of listening to you i tell you that from this day forward i will give that great man a pension of a thousand pieces of gold per month for his life nay though i were to share with him all my riches and dominions"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Instead of listening to you, I tell you that from this day forward, I will give that great man a pension of a thousand pieces of gold per month for his life. Nay, though I were to share with him all my riches and privileges.<|im_end|>", 0.7445108890533447, -0.6712242960929871, "instead of listening to you i tell you that from this day forward i will give that great man a pension of a thousand pieces of gold per month for his life nay though i were to share with him all my riches and dominions"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Instead of listening to you, I tell you that from this day forward, I will give that great man a pension of a thousand pieces of gold per month for his life nay, though I were to share with him all my riches and dominions.<|im_end|>", 0.8011671900749207, 3.1184284687042236, "instead of listening to you i tell you that from this day forward i will give that great man a pension of a thousand pieces of gold per month for his life nay though i were to share with him all my riches and dominions"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Instead of listening to you, I tell you that from this day forward, I will give that great man a pension of a thousand pieces of gold per month for his life. 
Nay, though I were to share with him all my riches and dominions.<|im_end|>", 0.7513310313224792, -0.21503543853759766, "instead of listening to you i tell you that from this day forward i will give that great man a pension of a thousand pieces of gold per month for his life nay though i were to share with him all my riches and dominions"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Instead of listening to you, I tell you that from this day forward, I will give that great man a pension of a thousand pieces of gold per month for his life. Nay, though I were to share with him all my riches and dominions.<|im_end|>", 0.7513310313224792, -0.21503543853759766, "instead of listening to you i tell you that from this day forward i will give that great man a pension of a thousand pieces of gold per month for his life nay though i were to share with him all my riches and dominions"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Instead of listening to you, I tell you that from this day forward, I will give that great man a pension of a thousand pieces of gold per month for his life. Nay, though I were to share with him all my riches and dominions.<|im_end|>", 0.7513310313224792, -0.21503543853759766, "instead of listening to you i tell you that from this day forward i will give that great man a pension of a thousand pieces of gold per month for his life nay though i were to share with him all my riches and dominions"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Instead of listening to you, I tell you that from this day forward, I will give that great man a pension of a thousand pieces of gold per month for his life. 
Nay, though I were to share with him all my riches and dominions.<|im_end|>", 0.7513310313224792, -0.21503543853759766, "instead of listening to you i tell you that from this day forward i will give that great man a pension of a thousand pieces of gold per month for his life nay though i were to share with him all my riches and dominions"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The baker shook his head, but the crime which I have committed now or has just passed on me of justice and you can only deliver me from it by blessing us secretly as you have just done come up handed said the procurator.<|im_end|>", -0.15717686712741852, -1.0923786163330078, "The beggar shook his head. The crime which I have committed, my lord, has no call upon human justice. And you can only deliver me from it by blessing me frequently, as you have just done. Come be candid, said the coadjutor."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The beggar shook his head. The crime which I have committed, my lord, has no place among you in justice, and you can only deliver me from it by blessing me frequently as you have just done. Come, I command it said the procurator.<|im_end|>", 0.34490713477134705, 0.8904600739479065, "The beggar shook his head. The crime which I have committed, my lord, has no call upon human justice. And you can only deliver me from it by blessing me frequently, as you have just done. 
Come be candid, said the coadjutor."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The baker shook his head, the crime which I have committed now or has been called a thing of justice and you can only deliver me from it by blessing as frequently as you have just done come up hand said the procurator.<|im_end|>", -0.093899667263031, -0.8424832224845886, "The beggar shook his head. The crime which I have committed, my lord, has no call upon human justice. And you can only deliver me from it by blessing me frequently, as you have just done. Come be candid, said the coadjutor."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The baker shook his head, the crime which I have committed my lord has no place in human justice, and you can only deliver me from it by blessing me secretly as you have just done. Come, let's end it said the procurator.<|im_end|>", 0.19140377640724182, 0.2842419743537903, "The beggar shook his head. The crime which I have committed, my lord, has no call upon human justice. And you can only deliver me from it by blessing me frequently, as you have just done. Come be candid, said the coadjutor."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The beggar shook his head, the crime which I have committed now or has been called upon me in justice and you can only deliver me from it by blessing me frequently as you have just done come up hand said the procurator.<|im_end|>", 0.13035276532173157, 0.0431382916867733, "The beggar shook his head. The crime which I have committed, my lord, has no call upon human justice. And you can only deliver me from it by blessing me frequently, as you have just done. 
Come be candid, said the coadjutor."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The baker shook his head. The crime which I have committed, my lord, has no cause of human justice. And you can only deliver me from it by blessing me frequently as you have just done. Come, put hand before the prosecutor.<|im_end|>", 0.4522962272167206, 1.3145629167556763, "The beggar shook his head. The crime which I have committed, my lord, has no call upon human justice. And you can only deliver me from it by blessing me frequently, as you have just done. Come be candid, said the coadjutor."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The baker shook his head, the crime which I have committed now would have no place among you in justice and you can only deliver me from it by blessing me frequently as you have just done come with candids said the procurator.<|im_end|>", -0.018617816269397736, -0.5451788902282715, "The beggar shook his head. The crime which I have committed, my lord, has no call upon human justice. And you can only deliver me from it by blessing me frequently, as you have just done. Come be candid, said the coadjutor."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The baker shook his head, the crime which I have committed now or has already caused me no justice, and you can only deliver me from it by blessing me secretly as you have just done. Come with candids said the prelate judge.<|im_end|>", 0.04945759102702141, -0.276334285736084, "The beggar shook his head. The crime which I have committed, my lord, has no call upon human justice. And you can only deliver me from it by blessing me frequently, as you have just done. 
Come be candid, said the coadjutor."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The beggar shook his head. The crime which I have committed, my lord, has no cause of human justice. And you can only deliver me from it by blessing me secretly as you have just done. Come up hanged said the persecutor.<|im_end|>", 0.6505840420722961, 2.097644567489624, "The beggar shook his head. The crime which I have committed, my lord, has no call upon human justice. And you can only deliver me from it by blessing me frequently, as you have just done. Come be candid, said the coadjutor."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The baker shook his head, the crime which I have committed now will be called by you injustice, and you can only deliver me from it by blessing us secretly as we have just done come up handed said the presider.<|im_end|>", -0.1792697161436081, -1.1796281337738037, "The beggar shook his head. The crime which I have committed, my lord, has no call upon human justice. And you can only deliver me from it by blessing me frequently, as you have just done. Come be candid, said the coadjutor."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The baker shook his head, the crime which I have committed now would have no place among you in justice and you can only deliver me from it by blessing me frequently as you have just done come with candids said the procurator.<|im_end|>", -0.018617816269397736, -0.5451788902282715, "The beggar shook his head. The crime which I have committed, my lord, has no call upon human justice. And you can only deliver me from it by blessing me frequently, as you have just done. 
Come be candid, said the coadjutor."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The baker shook his head. The crime which I have committed, my lord, has no place among men of justice, and you can only deliver me from it by blessing us frequently as you have just done come, I command it said the prelate jer.<|im_end|>", 0.08173446357250214, -0.1488659381866455, "The beggar shook his head. The crime which I have committed, my lord, has no call upon human justice. And you can only deliver me from it by blessing me frequently, as you have just done. Come be candid, said the coadjutor."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>So she had buttons up, and they were gradually accumulating with the emotions that stirred within one's mind for a perverse bush way. And his seeming grey matter now stirred the remembrance that but a year before, that women were riding the house you mean the shepherd<|im_end|>", -0.7879099249839783, -0.19305643439292908, "the buttons on phelan's coat were fairly undulating with the emotions that stirred within him in his seething gray matter there stirred the remembrance that bateato had told him that women were robbing the house you mean the women"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>So she did what was her favorite secret and tried to meditate with the emotions that stirred within one at first bushwick's heart in his seeming grey matter there stirred the remembrance that but a year ago he had been glummed for riding the house you mean to say it<|im_end|>", -1.2214081287384033, -1.8504221439361572, "the buttons on phelan's coat were fairly undulating with the emotions that stirred within him in his seething gray matter there stirred the remembrance that bateato had told him that women were 
robbing the house you mean the women"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Buttons had failed to wake him, and he was still accumulating with the emotions that stirred within him when he first bushwacked in his seething grey matter there stirred the remembrance that battyappo had told him that women were riding the house you mean a woman.<|im_end|>", -0.3585851192474365, 1.4483534097671509, "the buttons on phelan's coat were fairly undulating with the emotions that stirred within him in his seething gray matter there stirred the remembrance that bateato had told him that women were robbing the house you mean the women"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>So she did buttons of phaeton's face, and her accumulating with the emotions that stirred within him when he thought of those bushwhackers in his seething grey matter there stirred the remembrance that batty applewood had been there when they were riding the house you mean the sheriff<|im_end|>", -0.7295647859573364, 0.03001077100634575, "the buttons on phelan's coat were fairly undulating with the emotions that stirred within him in his seething gray matter there stirred the remembrance that bateato had told him that women were robbing the house you mean the women"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Shall button some favorite speaker and start accumulating with the emotions that stirred within one heart from verse bushwick's in seeming gray matter there stirred the remembrance that but a year before that women were riding the house you mean to show me<|im_end|>", -0.5899039506912231, 0.5639670491218567, "the buttons on phelan's coat were fairly undulating with the emotions that stirred within him in his seething gray matter there stirred the 
remembrance that bateato had told him that women were robbing the house you mean the women"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>So she'd bought some papers, and they kept accumulating with the emotions that stirred within one head from a first bushwick incident in seeming grey matter that stirred the remembrance that but a year before, that women were riding the house you mean the sheriff<|im_end|>", -0.8270294070243835, -0.3426194489002228, "the buttons on phelan's coat were fairly undulating with the emotions that stirred within him in his seething gray matter there stirred the remembrance that bateato had told him that women were robbing the house you mean the women"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>To shiver buttons on pavements and paving stones, accumulating with the emotions that stirred within one night from a first bush walk in his seemingly gray matter there stirred the remembrance that boccali had told them women were robbing the house you mean the sheriff.<|im_end|>", -0.24420489370822906, 1.8856559991836548, "the buttons on phelan's coat were fairly undulating with the emotions that stirred within him in his seething gray matter there stirred the remembrance that bateato had told him that women were robbing the house you mean the women"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>So she did what had some failing to break in, but he was accumulating with the emotions that stirred within him when he first met her. 
His seeming gray matter then stirred the remembrance that monte agello told him that women were riding the house you mean a woman?<|im_end|>", -0.9054762721061707, -0.6425402760505676, "the buttons on phelan's coat were fairly undulating with the emotions that stirred within him in his seething gray matter there stirred the remembrance that bateato had told him that women were robbing the house you mean the women"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>But some failing brain, in struggling with the emotions that stirred within one's mind from the first bushwackings, had succeeded in gray matter to restore the remembrance that botyappo told them that women were robbing the house you mean a woman<|im_end|>", -0.6036410331726074, 0.5114469528198242, "the buttons on phelan's coat were fairly undulating with the emotions that stirred within him in his seething gray matter there stirred the remembrance that bateato had told him that women were robbing the house you mean the women"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>What was on pailor's face, as she lay there accumulating with the emotions that stirred within one night from her first bush walk? 
It seemed in gray matter that stirred the remembrance that battyata had told them women were riding the house you mean a woman.<|im_end|>", -0.8083580732345581, -0.27123454213142395, "the buttons on phelan's coat were fairly undulating with the emotions that stirred within him in his seething gray matter there stirred the remembrance that bateato had told him that women were robbing the house you mean the women"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>So she did what tongues of phalanx waited and eagerly accumulating with the emotions that stirred within one heart for hours bushwick's voice in seeming grey matter had stirred the remembrance that buffy applewood knew that women were rotting the house you mean a servant?<|im_end|>", -0.9248790740966797, -0.716721773147583, "the buttons on phelan's coat were fairly undulating with the emotions that stirred within him in his seething gray matter there stirred the remembrance that bateato had told him that women were robbing the house you mean the women"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>So she had bought some table scraps and was very jubilating with the emotions that stirred within her when I first bushwaked. In his seeming gray matter, there stirred the remembrance that but a year before, that women were riding the house. 
You mean no shit.<|im_end|>", -0.848011314868927, -0.4228382110595703, "the buttons on phelan's coat were fairly undulating with the emotions that stirred within him in his seething gray matter there stirred the remembrance that bateato had told him that women were robbing the house you mean the women"], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They set up the side show early in the morning before the first guests arrived at park.<|im_end|>", 0.7450000047683716, 0.012902800925076008, "They set up the sideshow early in the morning before the first guests arrived at park."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They set up the sideshow early in the morning before the first guest arrived at park.<|im_end|>", 0.8543975949287415, 0.8922801613807678, "They set up the sideshow early in the morning before the first guests arrived at park."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They set up the side show early in the morning before the first guests arrived at park.<|im_end|>", 0.7450000047683716, 0.012902800925076008, "They set up the sideshow early in the morning before the first guests arrived at park."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They set up the sideshow early in the morning before the first guests arrived at park.<|im_end|>", 1.0, 2.062685012817383, "They set up the sideshow early in the morning before the first guests arrived at park."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They set up the side show early in the morning before the first guest arrived at park.<|im_end|>", 0.5806475877761841, -1.3082213401794434, "They set up the sideshow 
early in the morning before the first guests arrived at park."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They set up the side show early in the morning before the first guests arrived at park.<|im_end|>", 0.7450000047683716, 0.012902800925076008, "They set up the sideshow early in the morning before the first guests arrived at park."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They set up the side show early in the morning before the first guest arrived at park.<|im_end|>", 0.5806475877761841, -1.3082213401794434, "They set up the sideshow early in the morning before the first guests arrived at park."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They set up the side show early in the morning before the first guest arrived at park.<|im_end|>", 0.5806475877761841, -1.3082213401794434, "They set up the sideshow early in the morning before the first guests arrived at park."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They set up the side show early in the morning before the first guests arrived at park.<|im_end|>", 0.7450000047683716, 0.012902800925076008, "They set up the sideshow early in the morning before the first guests arrived at park."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They set up the side show early in the morning before the first guests arrived at park.<|im_end|>", 0.7450000047683716, 0.012902800925076008, "They set up the sideshow early in the morning before the first guests arrived at park."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They set up the sideshow early in 
the morning before the first guest arrived at park.<|im_end|>", 0.8543975949287415, 0.8922801613807678, "They set up the sideshow early in the morning before the first guests arrived at park."], ["10", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They set up the side show early in the morning before the first guests arrived at park.<|im_end|>", 0.7450000047683716, 0.012902800925076008, "They set up the sideshow early in the morning before the first guests arrived at park."]]}
wandb/run-20260417_125349-3c0s7mq3/files/output.log ADDED
@@ -0,0 +1,76 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ wandb: Detected [openai] in use.
2
+ wandb: Use W&B Weave for improved LLM call tracing. Install Weave with `pip install weave` then add `import weave` to the top of your script.
3
+ wandb: For more information, check out the docs at: https://weave-docs.wandb.ai/
4
+ Train: 0%| | 0/9327 [00:00<?, ?it/s]Could not estimate the number of tokens of the input, floating-point operations will not be computed
5
+ [DEBUG generate] shape= (12, 245) last_col_pad_cnt= 0 first_col_pad_cnt= 0
6
+ [DEBUG _encode] has_resp= True prompt_len= 245 resp_len= 59 full_len= 304 label_non_ignore= 59
7
+ [DEBUG _encode] has_resp= True prompt_len= 245 resp_len= 53 full_len= 298 label_non_ignore= 53
8
+ [DEBUG _encode] has_resp= True prompt_len= 245 resp_len= 53 full_len= 298 label_non_ignore= 53
9
+ [DEBUG _encode] has_resp= True prompt_len= 245 resp_len= 54 full_len= 299 label_non_ignore= 54
10
+ [DEBUG _encode] has_resp= True prompt_len= 245 resp_len= 49 full_len= 294 label_non_ignore= 49
11
+ [DEBUG _encode] has_resp= True prompt_len= 245 resp_len= 60 full_len= 305 label_non_ignore= 60
12
+ [DEBUG _encode] has_resp= True prompt_len= 245 resp_len= 57 full_len= 302 label_non_ignore= 57
13
+ [DEBUG _encode] has_resp= True prompt_len= 245 resp_len= 55 full_len= 300 label_non_ignore= 55
14
+ [DEBUG _encode] has_resp= True prompt_len= 245 resp_len= 60 full_len= 305 label_non_ignore= 60
15
+ [DEBUG _encode] has_resp= True prompt_len= 245 resp_len= 51 full_len= 296 label_non_ignore= 51
16
+ [DEBUG generate] shape= (12, 245) last_col_pad_cnt= 0 first_col_pad_cnt= 0
17
+ [DEBUG generate] shape= (12, 74) last_col_pad_cnt= 0 first_col_pad_cnt= 0
18
+ [DEBUG generate] shape= (12, 74) last_col_pad_cnt= 0 first_col_pad_cnt= 0
19
+ Train: 0%| | 8/9327 [05:07<97:17:19, 37.58s/it]
20
+ {'loss': 0.00335923, 'grad_norm': 0.40496424, 'learning_rate': 1.8e-07, 'completions/mean_length': 46.63020992, 'completions/min_length': 29.0, 'completions/max_length': 62.5, 'completions/clipped_ratio': 0.0, 'reward': -0.39390102, 'reward_std': 0.14572198, 'frac_reward_zero_std': 0.0, 'rewards/ASRWerSubLenCmpHalluDirtyV56/mean': -0.39390099, 'rewards/ASRWerSubLenCmpHalluDirtyV56/std': 0.2566371, 'kl': 0.0, 'clip_ratio/low_mean': 0.0, 'clip_ratio/low_min': 0.0, 'clip_ratio/high_mean': 0.0, 'clip_ratio/high_max': 0.0, 'clip_ratio/region_mean': 0.0, 'step_time': 22.53670275, 'epoch': 0.0, 'global_step/max_steps': '1/9327', 'elapsed_time': '45s', 'remaining_time': '4d 21h 45m 37s', 'memory(GiB)': 6.6, 'train_speed(s/it)': 45.457502}
21
+ [DEBUG generate] shape= (12, 250) last_col_pad_cnt= 0 first_col_pad_cnt= 0
22
+ [DEBUG generate] shape= (12, 250) last_col_pad_cnt= 0 first_col_pad_cnt= 0
23
+ [DEBUG generate] shape= (12, 226) last_col_pad_cnt= 0 first_col_pad_cnt= 0
24
+ [DEBUG generate] shape= (12, 226) last_col_pad_cnt= 0 first_col_pad_cnt= 0
25
+ [DEBUG generate] shape= (12, 249) last_col_pad_cnt= 0 first_col_pad_cnt= 0
26
+ [DEBUG generate] shape= (12, 249) last_col_pad_cnt= 0 first_col_pad_cnt= 0
27
+ [DEBUG generate] shape= (12, 255) last_col_pad_cnt= 0 first_col_pad_cnt= 0
28
+ [DEBUG generate] shape= (12, 255) last_col_pad_cnt= 0 first_col_pad_cnt= 0
29
+ [DEBUG generate] shape= (12, 257) last_col_pad_cnt= 0 first_col_pad_cnt= 0
30
+ [DEBUG generate] shape= (12, 257) last_col_pad_cnt= 0 first_col_pad_cnt= 0
31
+ [DEBUG generate] shape= (12, 244) last_col_pad_cnt= 0 first_col_pad_cnt= 0
32
+ [DEBUG generate] shape= (12, 244) last_col_pad_cnt= 0 first_col_pad_cnt= 0
33
+ [DEBUG generate] shape= (12, 253) last_col_pad_cnt= 0 first_col_pad_cnt= 0
34
+ [DEBUG generate] shape= (12, 253) last_col_pad_cnt= 0 first_col_pad_cnt= 0
35
+ [DEBUG generate] shape= (12, 254) last_col_pad_cnt= 0 first_col_pad_cnt= 0
36
+ [DEBUG generate] shape= (12, 254) last_col_pad_cnt= 0 first_col_pad_cnt= 0
37
+ {'loss': 0.00341008, 'grad_norm': 0.55847734, 'learning_rate': 8.9e-07, 'completions/mean_length': 50.98437619, 'completions/min_length': 33.875, 'completions/max_length': 64.0625, 'completions/clipped_ratio': 0.0, 'reward': -0.02726497, 'reward_std': 0.16105477, 'frac_reward_zero_std': 0.0, 'rewards/ASRWerSubLenCmpHalluDirtyV56/mean': -0.02726497, 'rewards/ASRWerSubLenCmpHalluDirtyV56/std': 0.40726903, 'kl': 0.0036334, 'clip_ratio/low_mean': 0.01024817, 'clip_ratio/low_min': 0.00230935, 'clip_ratio/high_mean': 0.0056009, 'clip_ratio/high_max': 0.01153785, 'clip_ratio/region_mean': 0.01584908, 'step_time': 18.11644147, 'epoch': 0.0, 'global_step/max_steps': '5/9327', 'elapsed_time': '3m 15s', 'remaining_time': '4d 5h 3m 13s', 'memory(GiB)': 6.7, 'train_speed(s/it)': 39.025256}
38
+ [DEBUG generate] shape= (12, 239) last_col_pad_cnt= 0 first_col_pad_cnt= 0
39
+ [DEBUG generate] shape= (12, 239) last_col_pad_cnt= 0 first_col_pad_cnt= 0
40
+ [DEBUG generate] shape= (12, 246) last_col_pad_cnt= 0 first_col_pad_cnt= 0
41
+ [DEBUG generate] shape= (12, 246) last_col_pad_cnt= 0 first_col_pad_cnt= 0
42
+ [DEBUG generate] shape= (12, 135) last_col_pad_cnt= 0 first_col_pad_cnt= 0
43
+ [DEBUG generate] shape= (12, 135) last_col_pad_cnt= 0 first_col_pad_cnt= 0
44
+ [DEBUG generate] shape= (12, 221) last_col_pad_cnt= 0 first_col_pad_cnt= 0
45
+ [DEBUG generate] shape= (12, 221) last_col_pad_cnt= 0 first_col_pad_cnt= 0
46
+ [DEBUG generate] shape= (12, 244) last_col_pad_cnt= 0 first_col_pad_cnt= 0
47
+ [DEBUG generate] shape= (12, 244) last_col_pad_cnt= 0 first_col_pad_cnt= 0
48
+ [DEBUG generate] shape= (12, 236) last_col_pad_cnt= 0 first_col_pad_cnt= 0
49
+ [DEBUG generate] shape= (12, 236) last_col_pad_cnt= 0 first_col_pad_cnt= 0
50
+ [DEBUG generate] shape= (12, 244) last_col_pad_cnt= 0 first_col_pad_cnt= 0
51
+ [DEBUG generate] shape= (12, 244) last_col_pad_cnt= 0 first_col_pad_cnt= 0
52
+ [DEBUG generate] shape= (12, 244) last_col_pad_cnt= 0 first_col_pad_cnt= 0
53
+ [DEBUG generate] shape= (12, 244) last_col_pad_cnt= 0 first_col_pad_cnt= 0
54
+ [DEBUG generate] shape= (12, 236) last_col_pad_cnt= 0 first_col_pad_cnt= 0
55
+ [DEBUG generate] shape= (12, 236) last_col_pad_cnt= 0 first_col_pad_cnt= 0
56
+ [DEBUG generate] shape= (12, 238) last_col_pad_cnt= 0 first_col_pad_cnt= 0
57
+ [DEBUG generate] shape= (12, 238) last_col_pad_cnt= 0 first_col_pad_cnt= 0
58
+ {'loss': 0.00361177, 'grad_norm': 0.37292629, 'learning_rate': 1.79e-06, 'completions/mean_length': 51.17916794, 'completions/min_length': 35.95, 'completions/max_length': 65.9, 'completions/clipped_ratio': 0.0, 'reward': -0.01967886, 'reward_std': 0.1592014, 'frac_reward_zero_std': 0.0, 'rewards/ASRWerSubLenCmpHalluDirtyV56/mean': -0.01967885, 'rewards/ASRWerSubLenCmpHalluDirtyV56/std': 0.47400118, 'kl': 0.00512733, 'clip_ratio/low_mean': 0.01430356, 'clip_ratio/low_min': 0.00256842, 'clip_ratio/high_mean': 0.00864687, 'clip_ratio/high_max': 0.01792681, 'clip_ratio/region_mean': 0.02295043, 'step_time': 18.99083556, 'epoch': 0.0, 'global_step/max_steps': '10/9327', 'elapsed_time': '6m 28s', 'remaining_time': '4d 4h 26m 47s', 'memory(GiB)': 6.7, 'train_speed(s/it)': 38.811493}
59
+ [DEBUG generate] shape= (12, 223) last_col_pad_cnt= 0 first_col_pad_cnt= 0
60
+ [DEBUG generate] shape= (12, 223) last_col_pad_cnt= 0 first_col_pad_cnt= 0
61
+ [DEBUG generate] shape= (12, 241) last_col_pad_cnt= 0 first_col_pad_cnt= 0
62
+ [DEBUG generate] shape= (12, 241) last_col_pad_cnt= 0 first_col_pad_cnt= 0
63
+ [DEBUG generate] shape= (12, 193) last_col_pad_cnt= 0 first_col_pad_cnt= 0
64
+ [DEBUG generate] shape= (12, 193) last_col_pad_cnt= 0 first_col_pad_cnt= 0
65
+ [DEBUG generate] shape= (12, 246) last_col_pad_cnt= 0 first_col_pad_cnt= 0
66
+ [DEBUG generate] shape= (12, 246) last_col_pad_cnt= 0 first_col_pad_cnt= 0
67
+ [DEBUG generate] shape= (12, 252) last_col_pad_cnt= 0 first_col_pad_cnt= 0
68
+ [DEBUG generate] shape= (12, 252) last_col_pad_cnt= 0 first_col_pad_cnt= 0
69
+ [DEBUG generate] shape= (12, 252) last_col_pad_cnt= 0 first_col_pad_cnt= 0
70
+ [DEBUG generate] shape= (12, 252) last_col_pad_cnt= 0 first_col_pad_cnt= 0
71
+ [DEBUG generate] shape= (12, 248) last_col_pad_cnt= 0 first_col_pad_cnt= 0
72
+ [DEBUG generate] shape= (12, 248) last_col_pad_cnt= 0 first_col_pad_cnt= 0
73
+ [DEBUG generate] shape= (12, 231) last_col_pad_cnt= 0 first_col_pad_cnt= 0
74
+ [DEBUG generate] shape= (12, 231) last_col_pad_cnt= 0 first_col_pad_cnt= 0
75
+ [DEBUG generate] shape= (12, 247) last_col_pad_cnt= 0 first_col_pad_cnt= 0
76
+ [DEBUG generate] shape= (12, 247) last_col_pad_cnt= 0 first_col_pad_cnt= 0
wandb/run-20260417_125349-3c0s7mq3/files/requirements.txt ADDED
@@ -0,0 +1,255 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ psutil==7.2.2
2
+ colorama==0.4.6
3
+ typing-inspection==0.4.2
4
+ dill==0.3.8
5
+ aliyun-python-sdk-kms==2.16.5
6
+ urllib3==2.6.3
7
+ torch==2.6.0
8
+ threadpoolctl==3.6.0
9
+ pyzmq==27.1.0
10
+ astor==0.8.1
11
+ hf-xet==1.4.3
12
+ sniffio==1.3.1
13
+ tensorboard==2.20.0
14
+ fastar==0.11.0
15
+ llvmlite==0.43.0
16
+ pathspec==1.0.4
17
+ mkl_fft==1.3.11
18
+ prometheus_client==0.25.0
19
+ async-timeout==5.0.1
20
+ scikit-learn==1.7.2
21
+ sortedcontainers==2.4.0
22
+ Bottleneck==1.4.2
23
+ orjson==3.11.8
24
+ nest-asyncio==1.6.0
25
+ cupy-cuda12x==13.6.0
26
+ semantic-version==2.10.0
27
+ aiosignal==1.4.0
28
+ fsspec==2025.3.0
29
+ dyNET38==2.2
30
+ shellingham==1.5.4
31
+ zstandard==0.25.0
32
+ PyYAML==6.0.3
33
+ nvidia-curand-cu12==10.3.5.147
34
+ gradio==5.50.0
35
+ Werkzeug==3.1.8
36
+ grpcio==1.80.0
37
+ aiohttp==3.13.5
38
+ Flask==3.1.3
39
+ python-json-logger==4.1.0
40
+ trl==0.29.1
41
+ nltk==3.9.4
42
+ platformdirs==4.9.6
43
+ lm-format-enforcer==0.10.12
44
+ pyparsing==3.3.2
45
+ jmespath==0.10.0
46
+ starlette==0.52.1
47
+ crcmod==1.7
48
+ dnspython==2.8.0
49
+ antlr4-python3-runtime==4.9.3
50
+ rouge==1.0.1
51
+ importlib_metadata==9.0.0
52
+ nvidia-cudnn-cu12==9.1.0.70
53
+ safetensors==0.7.0
54
+ blake3==1.0.8
55
+ interegular==0.3.3
56
+ tiktoken==0.11.0
57
+ pydantic_core==2.41.4
58
+ outlines==0.1.11
59
+ airportsdata==20260315
60
+ rich-toolkit==0.19.7
61
+ multiprocess==0.70.16
62
+ sympy==1.13.1
63
+ psutil==7.2.2
64
+ h11==0.16.0
65
+ anyio==4.13.0
66
+ Cython==3.2.4
67
+ outlines_core==0.1.26
68
+ jsonschema==4.26.0
69
+ nvidia-cuda-cupti-cu12==12.4.127
70
+ meson-python==0.19.0
71
+ depyf==0.18.0
72
+ audioread==3.1.0
73
+ typer==0.24.1
74
+ nvidia-cuda-nvrtc-cu12==12.4.127
75
+ joblib==1.5.3
76
+ torchvision==0.21.0
77
+ hf-gradio==0.3.2
78
+ huggingface_hub==0.36.2
79
+ websockets==15.0.1
80
+ diskcache==5.6.3
81
+ mistral_common==1.11.0
82
+ partial-json-parser==0.2.1.1.post7
83
+ simplejson==3.20.2
84
+ watchfiles==1.1.1
85
+ Jinja2==3.1.6
86
+ GitPython==3.1.46
87
+ numexpr==2.11.0
88
+ pydub==0.25.1
89
+ brotli==1.2.0
90
+ binpacking==2.0.1
91
+ cmake==4.3.1
92
+ pydantic==2.12.3
93
+ mkl-service==2.4.0
94
+ protobuf==6.33.6
95
+ gguf==0.10.0
96
+ MarkupSafe==3.0.3
97
+ exceptiongroup==1.3.1
98
+ markdown-it-py==4.0.0
99
+ soxr==1.0.0
100
+ pyarrow==20.0.0
101
+ tqdm==4.67.3
102
+ meson==1.11.0
103
+ fonttools==4.62.1
104
+ annotated-types==0.7.0
105
+ networkx==3.4.2
106
+ nvidia-cuda-runtime-cu12==12.4.127
107
+ compressed-tensors==0.9.2
108
+ wandb==0.23.0
109
+ mdurl==0.1.2
110
+ charset-normalizer==3.4.7
111
+ Pygments==2.20.0
112
+ zipp==3.23.1
113
+ prometheus-fastapi-instrumentator==7.1.0
114
+ aiofiles==24.1.0
115
+ lark==1.2.2
116
+ addict==2.4.0
117
+ pydantic-settings==2.13.1
118
+ opencv-python-headless==4.11.0.86
119
+ certifi==2026.2.25
120
+ sox==1.5.0
121
+ nagisa==0.2.11
122
+ six==1.17.0
123
+ tokenizers==0.22.2
124
+ mkl_random==1.2.8
125
+ fastapi-cloud-cli==0.17.0
126
+ propcache==0.4.1
127
+ cachetools==7.0.5
128
+ rpds-py==0.30.0
129
+ torchaudio==2.6.0
130
+ setuptools==82.0.1
131
+ py-cpuinfo==9.0.0
132
+ tomli==2.4.1
133
+ xxhash==3.6.0
134
+ pip==26.0.1
135
+ contourpy==1.3.2
136
+ absl-py==2.4.0
137
+ mpmath==1.3.0
138
+ ms_swift==4.0.3
139
+ pyproject-metadata==0.11.0
140
+ aiohappyeyeballs==2.6.1
141
+ httpx==0.28.1
142
+ json_repair==0.59.4
143
+ blinker==1.9.0
144
+ tzdata==2025.3
145
+ tensorboard-data-server==0.7.2
146
+ pydantic-extra-types==2.11.1
147
+ Markdown==3.10.2
148
+ nvidia-cusparselt-cu12==0.6.2
149
+ rignore==0.7.6
150
+ openai==2.32.0
151
+ soundfile==0.13.1
152
+ lazy-loader==0.5
153
+ av==14.2.0
154
+ yarl==1.23.0
155
+ python-dateutil==2.9.0.post0
156
+ groovy==0.1.2
157
+ xformers==0.0.29.post2
158
+ qwen-omni-utils==0.0.9
159
+ rich==15.0.0
160
+ xgrammar==0.1.16
161
+ numba==0.60.0
162
+ nvidia-cusolver-cu12==11.6.1.9
163
+ scikit_build_core==0.12.2
164
+ ffmpy==1.0.0
165
+ wheel==0.46.3
166
+ jiter==0.14.0
167
+ oss2==2.19.1
168
+ transformers==4.57.6
169
+ fastrlock==0.8.3
170
+ click==8.3.2
171
+ pooch==1.9.0
172
+ distro==1.9.0
173
+ nvidia-cublas-cu12==12.4.5.8
174
+ regex==2026.4.4
175
+ cpm-kernels==1.0.11
176
+ safehttpx==0.1.7
177
+ matplotlib==3.10.8
178
+ httptools==0.7.1
179
+ nvidia-cusparse-cu12==12.3.1.170
180
+ qwen-asr==0.0.6
181
+ gradio_client==1.14.0
182
+ gitdb==4.0.12
183
+ fastapi-cli==0.0.24
184
+ soynlp==0.0.493
185
+ python-dotenv==1.2.2
186
+ nvidia-cufft-cu12==11.2.1.3
187
+ accelerate==1.12.0
188
+ tomlkit==0.13.3
189
+ triton==3.2.0
190
+ filelock==3.28.0
191
+ pycountry==26.2.16
192
+ modelscope==1.35.4
193
+ annotated-doc==0.0.4
194
+ referencing==0.37.0
195
+ numpy==1.26.4
196
+ aliyun-python-sdk-core==2.16.0
197
+ attrs==26.1.0
198
+ vllm==0.8.0
199
+ python-multipart==0.0.26
200
+ jsonschema-specifications==2025.9.1
201
+ idna==3.11
202
+ scipy==1.15.3
203
+ typing_extensions==4.15.0
204
+ itsdangerous==2.2.0
205
+ msgspec==0.21.1
206
+ msgpack==1.1.2
207
+ nvidia-nvjitlink-cu12==12.4.127
208
+ pycryptodome==3.23.0
209
+ ninja==1.13.0
210
+ pillow==11.3.0
211
+ email-validator==2.3.0
212
+ cryptography==46.0.7
213
+ peft==0.18.1
214
+ kiwisolver==1.5.0
215
+ cffi==2.0.0
216
+ einops==0.8.2
217
+ pytz==2026.1.post1
218
+ uvloop==0.22.1
219
+ requests==2.33.1
220
+ sentencepiece==0.2.1
221
+ attrdict==2.0.1
222
+ dacite==1.9.2
223
+ cloudpickle==3.1.2
224
+ ray==2.55.0
225
+ fastapi==0.135.3
226
+ librosa==0.11.0
227
+ ruff==0.15.10
228
+ multidict==6.7.1
229
+ smmap==5.0.3
230
+ packaging==26.0
231
+ pycparser==3.0
232
+ decorator==5.2.1
233
+ transformers-stream-generator==0.0.5
234
+ nvidia-nccl-cu12==2.21.5
235
+ frozenlist==1.8.0
236
+ uvicorn==0.44.0
237
+ datasets==3.6.0
238
+ cycler==0.12.1
239
+ omegaconf==2.3.0
240
+ httpcore==1.0.9
241
+ pandas==2.3.2
242
+ nvidia-nvtx-cu12==12.4.127
243
+ sentry-sdk==2.58.0
244
+ wheel==0.46.3
245
+ autocommand==2.2.2
246
+ tomli==2.4.0
247
+ packaging==26.0
248
+ more-itertools==10.8.0
249
+ zipp==3.23.0
250
+ platformdirs==4.4.0
251
+ jaraco.context==6.1.0
252
+ jaraco.text==4.0.0
253
+ backports.tarfile==1.2.0
254
+ jaraco.functools==4.4.0
255
+ importlib_metadata==8.7.1
wandb/run-20260417_125349-3c0s7mq3/files/wandb-metadata.json ADDED
@@ -0,0 +1,224 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "os": "Linux-3.10.0-957.el7.x86_64-x86_64-with-glibc2.17",
3
+ "python": "CPython 3.10.18",
4
+ "startedAt": "2026-04-17T04:53:49.174280Z",
5
+ "args": [
6
+ "--rlhf_type",
7
+ "grpo",
8
+ "--external_plugins",
9
+ "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/my_qwen3_asr_dapo_register.py",
10
+ "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/0417_reward.py",
11
+ "--model",
12
+ "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/qwen3-asr-merged",
13
+ "--model_type",
14
+ "my_qwen3_asr_rl",
15
+ "--template",
16
+ "my_qwen3_asr_rl",
17
+ "--dataset",
18
+ "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/lora_0323_10w+55w+error+syn_with_domain_train90_targeted_rl_train90_loramerged_basewer_3suppress_server.jsonl",
19
+ "--val_dataset",
20
+ "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/lora_0323_10w+55w+error+syn_with_domain_train90_targeted_rl_val5_sample5p_server.jsonl",
21
+ "--reward_funcs",
22
+ "asr_wer_sub_len_cmp_hallu_dirty_v56",
23
+ "--train_type",
24
+ "lora",
25
+ "--use_vllm",
26
+ "false",
27
+ "--log_completions",
28
+ "true",
29
+ "--loss_type",
30
+ "dapo",
31
+ "--advantage_estimator",
32
+ "grpo",
33
+ "--scale_rewards",
34
+ "group",
35
+ "--num_iterations",
36
+ "2",
37
+ "--beta",
38
+ "0.04",
39
+ "--epsilon_high",
40
+ "0.28",
41
+ "--dynamic_sample",
42
+ "true",
43
+ "--max_resample_times",
44
+ "4",
45
+ "--overlong_filter",
46
+ "true",
47
+ "--truncation_strategy",
48
+ "delete",
49
+ "--num_generations",
50
+ "12",
51
+ "--generation_batch_size",
52
+ "48",
53
+ "--per_device_train_batch_size",
54
+ "4",
55
+ "--per_device_eval_batch_size",
56
+ "4",
57
+ "--gradient_accumulation_steps",
58
+ "12",
59
+ "--num_generations_eval",
60
+ "4",
61
+ "--max_completion_length",
62
+ "256",
63
+ "--temperature",
64
+ "0.50",
65
+ "--top_p",
66
+ "0.95",
67
+ "--top_k",
68
+ "50",
69
+ "--repetition_penalty",
70
+ "1.08",
71
+ "--learning_rate",
72
+ "5e-5",
73
+ "--lr_scheduler_type",
74
+ "cosine",
75
+ "--warmup_ratio",
76
+ "0.03",
77
+ "--report_to",
78
+ "wandb",
79
+ "--run_name",
80
+ "qwen3asr_dapo_reward56_4x4x12_12gen_4GPU",
81
+ "--output_dir",
82
+ "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/out/qwen3asr_dapo_reward56_4x4x12_12gen_4GPU",
83
+ "--save_strategy",
84
+ "steps",
85
+ "--save_steps",
86
+ "20",
87
+ "--logging_steps",
88
+ "5",
89
+ "--freeze_llm",
90
+ "false",
91
+ "--freeze_vit",
92
+ "false",
93
+ "--freeze_aligner",
94
+ "false",
95
+ "--remove_unused_columns",
96
+ "false",
97
+ "--padding_side",
98
+ "left"
99
+ ],
100
+ "program": "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/cli/rlhf.py",
101
+ "email": "pang_kaiyu@163.com",
102
+ "root": "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload",
103
+ "host": "SH-IDC1-10-140-37-28",
104
+ "executable": "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/bin/python3.10",
105
+ "cpu_count": 64,
106
+ "cpu_count_logical": 128,
107
+ "gpu": "NVIDIA A100-SXM4-80GB",
108
+ "gpu_count": 8,
109
+ "disk": {
110
+ "/": {
111
+ "total": "524945911808",
112
+ "used": "49879580672"
113
+ }
114
+ },
115
+ "memory": {
116
+ "total": "1081627828224"
117
+ },
118
+ "gpu_nvidia": [
119
+ {
120
+ "name": "NVIDIA A100-SXM4-80GB",
121
+ "memoryTotal": "85899345920",
122
+ "cudaCores": 6912,
123
+ "architecture": "Ampere",
124
+ "uuid": "GPU-3da6624c-f6f7-fce6-4711-27acab73dc93"
125
+ },
126
+ {
127
+ "name": "NVIDIA A100-SXM4-80GB",
128
+ "memoryTotal": "85899345920",
129
+ "cudaCores": 6912,
130
+ "architecture": "Ampere",
131
+ "uuid": "GPU-dae83544-a631-a3fe-b5d5-e4fdd056c7a8"
132
+ },
133
+ {
134
+ "name": "NVIDIA A100-SXM4-80GB",
135
+ "memoryTotal": "85899345920",
136
+ "cudaCores": 6912,
137
+ "architecture": "Ampere",
138
+ "uuid": "GPU-621aa0b9-4a32-d349-8a16-20b8b6f0dde4"
139
+ },
140
+ {
141
+ "name": "NVIDIA A100-SXM4-80GB",
142
+ "memoryTotal": "85899345920",
143
+ "cudaCores": 6912,
144
+ "architecture": "Ampere",
145
+ "uuid": "GPU-642bed5e-3bf1-b5e0-8aba-33f8f64a5dcc"
146
+ },
147
+ {
148
+ "name": "NVIDIA A100-SXM4-80GB",
149
+ "memoryTotal": "85899345920",
150
+ "cudaCores": 6912,
151
+ "architecture": "Ampere",
152
+ "uuid": "GPU-6c70bd3b-1e58-bd2a-a10b-19891e3eab9a"
153
+ },
154
+ {
155
+ "name": "NVIDIA A100-SXM4-80GB",
156
+ "memoryTotal": "85899345920",
157
+ "cudaCores": 6912,
158
+ "architecture": "Ampere",
159
+ "uuid": "GPU-96e9e2d3-6436-3c7f-5a20-1d4a32e7992c"
160
+ },
161
+ {
162
+ "name": "NVIDIA A100-SXM4-80GB",
163
+ "memoryTotal": "85899345920",
164
+ "cudaCores": 6912,
165
+ "architecture": "Ampere",
166
+ "uuid": "GPU-dba7546f-0cda-e659-ca1d-4790c27ffe8d"
167
+ },
168
+ {
169
+ "name": "NVIDIA A100-SXM4-80GB",
170
+ "memoryTotal": "85899345920",
171
+ "cudaCores": 6912,
172
+ "architecture": "Ampere",
173
+ "uuid": "GPU-b0a96cf9-74f3-969a-e8d0-5a30f3f06d1e"
174
+ }
175
+ ],
176
+ "cudaVersion": "12.4",
177
+ "slurm": {
178
+ "cluster_name": "cluster_sproject3",
179
+ "conf": "/etc/slurm/slurm.conf",
180
+ "cpus_on_node": "2",
181
+ "gtids": "0",
182
+ "job_account": "research",
183
+ "job_cpus_per_node": "2",
184
+ "job_gid": "800000689",
185
+ "job_id": "8568855",
186
+ "job_name": "qwen3_asr_train_4gpu",
187
+ "job_nodelist": "SH-IDC1-10-140-37-28",
188
+ "job_num_nodes": "1",
189
+ "job_partition": "interntmp",
190
+ "job_qos": "normal",
191
+ "job_uid": "800000689",
192
+ "job_user": "panjiabao",
193
+ "jobid": "8568855",
194
+ "launch_node_ipaddr": "10.140.37.164",
195
+ "localid": "0",
196
+ "nnodes": "1",
197
+ "nodeid": "0",
198
+ "nodelist": "SH-IDC1-10-140-37-28",
199
+ "nprocs": "1",
200
+ "ntasks": "1",
201
+ "ntasks_per_node": "1",
202
+ "prio_process": "0",
203
+ "procid": "0",
204
+ "srun_comm_host": "10.140.37.164",
205
+ "srun_comm_port": "39944",
206
+ "step_gpus": "4,5,6,7",
207
+ "step_id": "0",
208
+ "step_launcher_port": "39944",
209
+ "step_nodelist": "SH-IDC1-10-140-37-28",
210
+ "step_num_nodes": "1",
211
+ "step_num_tasks": "1",
212
+ "step_tasks_per_node": "1",
213
+ "stepid": "0",
214
+ "submit_dir": "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload",
215
+ "submit_host": "SH-IDC1-10-140-37-164",
216
+ "task_pid": "253884",
217
+ "tasks_per_node": "1",
218
+ "topology_addr": "SH-IDC1-10-140-37-28",
219
+ "topology_addr_pattern": "node",
220
+ "umask": "0002",
221
+ "working_cluster": "cluster_sproject3:SH-IDC1-10-140-37-161:6817:9216:109"
222
+ },
223
+ "writerId": "j5sm4ok14e8glxftszvcldkdpfaj9tjk"
224
+ }
wandb/run-20260417_125349-3c0s7mq3/files/wandb-summary.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"profiling/Time taken: GRPOTrainer._prepare_inputs":1.0380055755376816e-05,"train/clip_ratio/low_min":0.0025684179776969056,"completions":{"artifact_path":"wandb-client-artifact://uxb8hpe90ova7jczka8irjgjvda1abucqjkcj2xforoqlkmgy8m2ogk528hkqzciqt27cmh80q6ooyt95k6jpzt8j12bp5out3isrdz6jt3e0rqqyb8j8sbkeuw9z88u/completions.table.json","ncols":6,"sha256":"510c5f07b145276e42100fb7a1579a1a90630c3d4b603b455e0179b2425e7ba9","size":27491,"log_mode":"IMMUTABLE","_latest_artifact_path":"wandb-client-artifact://c0nc1huy2dg0glf8439n1pxjl0jfm9ih2xohqkvhrckav2b6emj75t25u8r70nmykdappetknoyherfthhsx0dnv0iba9azrtgonx2q7fd4ur4g65wplov58boq40hos:latest/completions.table.json","nrows":48,"_type":"table-file","path":"media/table/completions_5_510c5f07b145276e4210.table.json"},"train/step_time":18.990835564490407,"profiling/Time taken: GRPOTrainer._generate_and_score_completions":6.459590430138633,"profiling/Time taken: GRPOTrainer._dynamic_sampling":0.0027582282200455666,"train/frac_reward_zero_std":0,"train/rewards/ASRWerSubLenCmpHalluDirtyV56/mean":-0.01967885121703148,"train/completions/clipped_ratio":0,"train/clip_ratio/high_max":0.01792680664608876,"train/epoch":0.0032164683177870698,"profiling/Time taken: GRPOTrainer.compute_loss":0.42181658814661205,"train/kl":0.005127331020776183,"_step":6,"train/clip_ratio/region_mean":0.022950426349416374,"train/clip_ratio/low_mean":0.014303557314754774,"train/rewards/ASRWerSubLenCmpHalluDirtyV56/std":0.4740011841058731,"profiling/Time taken: GRPOTrainer.log_metrics":0.021599401021376252,"profiling/Time taken: 
GRPOTrainer.resample_encode_failed_inputs":0.09793815203011036,"train/learning_rate":1.7857142857142857e-06,"train/clip_ratio/high_mean":0.008646869304357097,"train/reward":-0.019678859598934652,"train/completions/mean_length":51.179167938232425,"train/grad_norm":0.3729262948036194,"train/completions/max_length":65.9,"train/reward_std":0.15920140147209166,"train/completions/min_length":35.95,"train/loss":0.003611765429377556,"_timestamp":1.7764021900309644e+09,"_wandb":{"runtime":559},"profiling/Time taken: GRPOTrainer._get_per_token_logps_and_entropies":0.3787236858624965,"profiling/Time taken: GRPOTrainer._prepare_batch_inputs":1.4868471620138735,"profiling/Time taken: GRPOTrainer._score_completions":0.1824264999013394,"profiling/Time taken: GRPOTrainer.generate":4.603045840980485,"_runtime":559.310393838,"train/global_step":10,"profiling/Time taken: GRPOTrainer.ASRWerSubLenCmpHalluDirtyV56":0.18123672483488917}
wandb/run-20260417_125349-3c0s7mq3/logs/debug-core.log ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"time":"2026-04-17T12:53:49.510806063+08:00","level":"INFO","msg":"main: starting server","port-filename":"/tmp/tmp9sgje0qy/port-255159.txt","pid":255159,"log-level":0,"disable-analytics":false,"shutdown-on-parent-exit":false,"enable-dcgm-profiling":false}
2
+ {"time":"2026-04-17T12:53:49.512883475+08:00","level":"INFO","msg":"server: will exit if parent process dies","ppid":255159}
3
+ {"time":"2026-04-17T12:53:49.512897523+08:00","level":"INFO","msg":"server: accepting connections","addr":{"Name":"/tmp/wandb-255159-255838-1984267321/socket","Net":"unix"}}
4
+ {"time":"2026-04-17T12:53:49.589507097+08:00","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"1(@)"}
5
+ {"time":"2026-04-17T12:53:49.596836313+08:00","level":"INFO","msg":"handleInformInit: received","streamId":"3c0s7mq3","id":"1(@)"}
6
+ {"time":"2026-04-17T12:53:50.060383382+08:00","level":"INFO","msg":"handleInformInit: stream started","streamId":"3c0s7mq3","id":"1(@)"}
7
+ {"time":"2026-04-17T13:03:10.120189546+08:00","level":"INFO","msg":"handleInformTeardown: server teardown initiated","id":"1(@)"}
8
+ {"time":"2026-04-17T13:03:10.120718112+08:00","level":"INFO","msg":"server is shutting down"}
9
+ {"time":"2026-04-17T13:03:10.120709431+08:00","level":"INFO","msg":"connection: closing","id":"1(@)"}
10
+ {"time":"2026-04-17T13:03:10.1212097+08:00","level":"INFO","msg":"server: listener closed","addr":{"Name":"/tmp/wandb-255159-255838-1984267321/socket","Net":"unix"}}
11
+ {"time":"2026-04-17T13:03:10.121584463+08:00","level":"INFO","msg":"connection: closed successfully","id":"1(@)"}
wandb/run-20260417_125349-3c0s7mq3/logs/debug-internal.log ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"time":"2026-04-17T12:53:49.599295874+08:00","level":"INFO","msg":"stream: starting","core version":"0.23.0"}
2
+ {"time":"2026-04-17T12:53:50.056880322+08:00","level":"INFO","msg":"stream: created new stream","id":"3c0s7mq3"}
3
+ {"time":"2026-04-17T12:53:50.056952984+08:00","level":"INFO","msg":"handler: started","stream_id":"3c0s7mq3"}
4
+ {"time":"2026-04-17T12:53:50.060375782+08:00","level":"INFO","msg":"stream: started","id":"3c0s7mq3"}
5
+ {"time":"2026-04-17T12:53:50.060385935+08:00","level":"INFO","msg":"sender: started","stream_id":"3c0s7mq3"}
6
+ {"time":"2026-04-17T12:53:50.060388859+08:00","level":"INFO","msg":"writer: started","stream_id":"3c0s7mq3"}
7
+ {"time":"2026-04-17T13:03:10.120719587+08:00","level":"INFO","msg":"stream: closing","id":"3c0s7mq3"}
8
+ {"time":"2026-04-17T13:03:11.075949443+08:00","level":"INFO","msg":"fileTransfer: Close: file transfer manager closed"}
9
+ {"time":"2026-04-17T13:03:12.765331132+08:00","level":"INFO","msg":"handler: closed","stream_id":"3c0s7mq3"}
10
+ {"time":"2026-04-17T13:03:12.766657126+08:00","level":"INFO","msg":"sender: closed","stream_id":"3c0s7mq3"}
11
+ {"time":"2026-04-17T13:03:12.766668686+08:00","level":"INFO","msg":"stream: closed","id":"3c0s7mq3"}
wandb/run-20260417_125349-3c0s7mq3/logs/debug.log ADDED
@@ -0,0 +1,26 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2026-04-17 12:53:49,233 INFO MainThread:255159 [wandb_setup.py:_flush():80] Current SDK version is 0.23.0
2
+ 2026-04-17 12:53:49,233 INFO MainThread:255159 [wandb_setup.py:_flush():80] Configure stats pid to 255159
3
+ 2026-04-17 12:53:49,233 INFO MainThread:255159 [wandb_setup.py:_flush():80] Loading settings from /mnt/petrelfs/panjiabao/.config/wandb/settings
4
+ 2026-04-17 12:53:49,233 INFO MainThread:255159 [wandb_setup.py:_flush():80] Loading settings from /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/wandb/settings
5
+ 2026-04-17 12:53:49,233 INFO MainThread:255159 [wandb_setup.py:_flush():80] Loading settings from environment variables
6
+ 2026-04-17 12:53:49,233 INFO MainThread:255159 [wandb_init.py:setup_run_log_directory():713] Logging user logs to /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/wandb/run-20260417_125349-3c0s7mq3/logs/debug.log
7
+ 2026-04-17 12:53:49,233 INFO MainThread:255159 [wandb_init.py:setup_run_log_directory():714] Logging internal logs to /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/wandb/run-20260417_125349-3c0s7mq3/logs/debug-internal.log
8
+ 2026-04-17 12:53:49,233 INFO MainThread:255159 [wandb_init.py:init():840] calling init triggers
9
+ 2026-04-17 12:53:49,233 INFO MainThread:255159 [wandb_init.py:init():845] wandb.init called with sweep_config: {}
10
+ config: {'_wandb': {}}
11
+ 2026-04-17 12:53:49,233 INFO MainThread:255159 [wandb_init.py:init():888] starting backend
12
+ 2026-04-17 12:53:49,589 INFO MainThread:255159 [wandb_init.py:init():891] sending inform_init request
13
+ 2026-04-17 12:53:49,594 INFO MainThread:255159 [wandb_init.py:init():899] backend started and connected
14
+ 2026-04-17 12:53:49,598 INFO MainThread:255159 [wandb_init.py:init():969] updated telemetry
15
+ 2026-04-17 12:53:49,599 INFO MainThread:255159 [wandb_init.py:init():993] communicating run to backend with 90.0 second timeout
16
+ 2026-04-17 12:53:50,809 INFO MainThread:255159 [wandb_init.py:init():1040] starting run threads in backend
17
+ 2026-04-17 12:53:51,513 INFO MainThread:255159 [wandb_run.py:_console_start():2504] atexit reg
18
+ 2026-04-17 12:53:51,514 INFO MainThread:255159 [wandb_run.py:_redirect():2352] redirect: wrap_raw
19
+ 2026-04-17 12:53:51,514 INFO MainThread:255159 [wandb_run.py:_redirect():2421] Wrapping output streams.
20
+ 2026-04-17 12:53:51,514 INFO MainThread:255159 [wandb_run.py:_redirect():2444] Redirects installed.
21
+ 2026-04-17 12:53:51,521 INFO MainThread:255159 [wandb_init.py:init():1080] run started, returning control to user process
22
+ 2026-04-17 12:53:51,528 INFO MainThread:255159 [wandb_run.py:_config_callback():1385] config_cb None None {'peft_config': {'default': {'task_type': 'CAUSAL_LM', 'peft_type': 'LORA', 'auto_mapping': None, 'peft_version': '0.18.1', 'base_model_name_or_path': '/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/qwen3-asr-merged', 'revision': None, 'inference_mode': False, 'r': 8, 'target_modules': '^(thinker\\.model(?=\\.).*\\.(k_proj|q_proj|down_proj|up_proj|v_proj|gate_proj|o_proj)|thinker\\.audio_tower\\.layers(?=\\.).*\\.(k_proj|fc1|fc2|q_proj|out_proj|v_proj)|thinker\\.audio_tower\\.conv_out(?=\\.)|thinker\\.audio_tower\\.proj1(?=\\.)|thinker\\.audio_tower\\.proj2(?=\\.))$', 'exclude_modules': None, 'lora_alpha': 32, 'lora_dropout': 0.05, 'fan_in_fan_out': False, 'bias': 'none', 'use_rslora': False, 'modules_to_save': [], 'init_lora_weights': True, 'layers_to_transform': None, 'layers_pattern': None, 'rank_pattern': {}, 'alpha_pattern': {}, 'megatron_config': None, 'megatron_core': 'megatron.core', 'trainable_token_indices': None, 'loftq_config': {}, 'eva_config': None, 'corda_config': None, 'use_dora': False, 'alora_invocation_tokens': None, 'use_qalora': False, 'qalora_group_size': 16, 'layer_replication': None, 'runtime_config': {'ephemeral_gpu_offload': False}, 'lora_bias': False, 'target_parameters': None, 'arrow_config': None, 'ensure_weight_tying': False, 'lora_dtype': None, 'lorap_lr_ratio': None, 'lorap_emb_lr': 1e-06}}, 'return_dict': True, 'output_hidden_states': False, 'torchscript': False, 'dtype': 'bfloat16', 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'architectures': ['Qwen3ASRForConditionalGeneration'], 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'task_specific_params': None, 'problem_type': None, 
'tokenizer_class': None, 'prefix': None, 'bos_token_id': None, 'pad_token_id': 151643, 'eos_token_id': 151645, 'sep_token_id': None, 'decoder_start_token_id': None, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'temperature': 0.5, 'top_k': 50, 'top_p': 0.95, 'typical_p': 1.0, 'repetition_penalty': 1.08, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'num_beam_groups': 1, 'diversity_penalty': 0.0, '_name_or_path': '/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/qwen3-asr-merged', 'transformers_version': '4.57.6', 'model_type': 'qwen3_asr', 'tf_legacy_loss': False, 'use_bfloat16': False, 'thinker_config': {'return_dict': True, 'output_hidden_states': False, 'torchscript': False, 'dtype': 'bfloat16', 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'architectures': ['Qwen3ASRForConditionalGeneration'], 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'task_specific_params': None, 'problem_type': None, 'tokenizer_class': None, 'prefix': None, 'bos_token_id': None, 'pad_token_id': None, 'eos_token_id': None, 'sep_token_id': None, 'decoder_start_token_id': None, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'typical_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 
'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'num_beam_groups': 1, 'diversity_penalty': 0.0, '_name_or_path': '', 'audio_end_token_id': 151670, 'model_type': 'qwen3_asr_thinker', 'tf_legacy_loss': False, 'use_bfloat16': False, 'user_token_id': 872, 'audio_start_token_id': 151669, 'initializer_range': 0.02, 'audio_config': {'return_dict': True, 'output_hidden_states': False, 'torchscript': False, 'dtype': None, 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'architectures': None, 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'task_specific_params': None, 'problem_type': None, 'tokenizer_class': None, 'prefix': None, 'bos_token_id': None, 'pad_token_id': None, 'eos_token_id': None, 'sep_token_id': None, 'decoder_start_token_id': None, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'typical_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'num_beam_groups': 1, 'diversity_penalty': 0.0, '_name_or_path': '', 'model_type': 'qwen3_asr_audio_encoder', 'num_hidden_layers': 24, 'tf_legacy_loss': False, 'use_bfloat16': False, 'num_mel_bins': 128, 'd_model': 
1024, 'encoder_layers': 24, 'encoder_attention_heads': 16, 'encoder_ffn_dim': 4096, 'dropout': 0, 'attention_dropout': 0, 'activation_function': 'gelu', 'activation_dropout': 0, 'initializer_range': 0.02, 'scale_embedding': False, 'max_source_positions': 1500, 'n_window': 50, 'output_dim': 2048, 'n_window_infer': 800, 'conv_chunksize': 500, 'downsample_hidden_size': 480, 'output_attentions': False}, 'text_config': {'vocab_size': 151936, 'max_position_embeddings': 65536, 'hidden_size': 2048, 'intermediate_size': 6144, 'num_hidden_layers': 28, 'num_attention_heads': 16, 'num_key_value_heads': 8, 'head_dim': 128, 'hidden_act': 'silu', 'initializer_range': 0.02, 'rms_norm_eps': 1e-06, 'use_cache': False, 'rope_theta': 1000000, 'rope_scaling': {'interleaved': True, 'mrope_interleaved': True, 'mrope_section': [24, 20, 20], 'rope_type': 'default', 'type': 'default'}, 'attention_bias': False, 'attention_dropout': 0.0, 'return_dict': True, 'output_hidden_states': False, 'torchscript': False, 'dtype': None, 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'architectures': None, 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'task_specific_params': None, 'problem_type': None, 'tokenizer_class': None, 'prefix': None, 'bos_token_id': None, 'pad_token_id': 151643, 'eos_token_id': None, 'sep_token_id': None, 'decoder_start_token_id': None, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'typical_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 
'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'num_beam_groups': 1, 'diversity_penalty': 0.0, '_name_or_path': '', 'model_type': 'qwen3_asr_text', 'tf_legacy_loss': False, 'use_bfloat16': False, 'output_attentions': False}, 'audio_token_id': 151676, 'output_attentions': False}, 'support_languages': ['Chinese', 'English', 'Cantonese', 'Arabic', 'German', 'French', 'Spanish', 'Portuguese', 'Indonesian', 'Italian', 'Korean', 'Russian', 'Thai', 'Vietnamese', 'Japanese', 'Turkish', 'Hindi', 'Malay', 'Dutch', 'Swedish', 'Danish', 'Finnish', 'Polish', 'Czech', 'Filipino', 'Persian', 'Greek', 'Romanian', 'Hungarian', 'Macedonian'], 'output_attentions': False, 'output_dir': '/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/out/qwen3asr_dapo_reward56_4x4x12_12gen_4GPU/v4-20260417-125332', 'overwrite_output_dir': False, 'do_train': False, 'do_eval': True, 'do_predict': False, 'eval_strategy': 'steps', 'prediction_loss_only': False, 'per_device_train_batch_size': 4, 'per_device_eval_batch_size': 4, 'per_gpu_train_batch_size': None, 'per_gpu_eval_batch_size': None, 'gradient_accumulation_steps': 12, 'eval_accumulation_steps': None, 'eval_delay': 0, 'torch_empty_cache_steps': None, 'learning_rate': 5e-05, 'weight_decay': 0.1, 'adam_beta1': 0.9, 'adam_beta2': 0.95, 'adam_epsilon': 1e-08, 'max_grad_norm': 1.0, 'num_train_epochs': 3.0, 'max_steps': -1, 'lr_scheduler_type': 'cosine', 'lr_scheduler_kwargs': None, 'warmup_ratio': 0.03, 'warmup_steps': 0, 'log_level': 'passive', 'log_level_replica': 'warning', 'log_on_each_node': True, 'logging_dir': '/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/out/qwen3asr_dapo_reward56_4x4x12_12gen_4GPU/v4-20260417-125332/runs', 'logging_strategy': 'steps', 'logging_first_step': True, 'logging_steps': 5, 'logging_nan_inf_filter': True, 'save_strategy': 'steps', 'save_steps': 20, 'save_total_limit': 
None, 'save_safetensors': True, 'save_on_each_node': False, 'save_only_model': False, 'restore_callback_states_from_checkpoint': False, 'no_cuda': False, 'use_cpu': False, 'use_mps_device': False, 'seed': 42, 'data_seed': 42, 'jit_mode_eval': False, 'bf16': True, 'fp16': False, 'fp16_opt_level': 'O1', 'half_precision_backend': 'auto', 'bf16_full_eval': False, 'fp16_full_eval': False, 'tf32': None, 'local_rank': 0, 'ddp_backend': None, 'tpu_num_cores': None, 'tpu_metrics_debug': False, 'debug': [], 'dataloader_drop_last': True, 'eval_steps': 20, 'dataloader_num_workers': 1, 'dataloader_prefetch_factor': 2, 'past_index': -1, 'run_name': 'qwen3asr_dapo_reward56_4x4x12_12gen_4GPU', 'disable_tqdm': False, 'remove_unused_columns': False, 'label_names': None, 'load_best_model_at_end': False, 'metric_for_best_model': 'loss', 'greater_is_better': False, 'ignore_data_skip': False, 'fsdp': [], 'fsdp_min_num_params': 0, 'fsdp_config': {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}, 'fsdp_transformer_layer_cls_to_wrap': None, 'accelerator_config': {'split_batches': False, 'dispatch_batches': False, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None}, 'parallelism_config': None, 'deepspeed': None, 'label_smoothing_factor': 0.0, 'optim': 'adamw_torch', 'optim_args': None, 'adafactor': False, 'group_by_length': False, 'length_column_name': 'length', 'report_to': ['wandb'], 'project': 'huggingface', 'trackio_space_id': 'trackio', 'ddp_find_unused_parameters': None, 'ddp_bucket_cap_mb': None, 'ddp_broadcast_buffers': None, 'dataloader_pin_memory': True, 'dataloader_persistent_workers': False, 'skip_memory_metrics': True, 'use_legacy_prediction_loop': False, 'push_to_hub': False, 'resume_from_checkpoint': None, 'hub_model_id': None, 'hub_strategy': 'every_save', 'hub_token': '<HUB_TOKEN>', 'hub_private_repo': None, 'hub_always_push': False, 'hub_revision': None, 
'gradient_checkpointing': False, 'gradient_checkpointing_kwargs': None, 'include_inputs_for_metrics': False, 'include_for_metrics': [], 'eval_do_concat_batches': True, 'fp16_backend': 'auto', 'push_to_hub_model_id': None, 'push_to_hub_organization': None, 'push_to_hub_token': '<PUSH_TO_HUB_TOKEN>', 'mp_parameters': '', 'auto_find_batch_size': False, 'full_determinism': False, 'torchdynamo': None, 'ray_scope': 'last', 'ddp_timeout': 18000000, 'torch_compile': False, 'torch_compile_backend': None, 'torch_compile_mode': None, 'include_tokens_per_second': False, 'include_num_input_tokens_seen': 'no', 'neftune_noise_alpha': None, 'optim_target_modules': None, 'batch_eval_metrics': False, 'eval_on_start': False, 'use_liger_kernel': False, 'liger_kernel_config': None, 'eval_use_gather_object': False, 'average_tokens_across_devices': True, 'model_init_kwargs': None, 'disable_dropout': False, 'cast_lm_head_to_fp32': False, 'num_generations': 12, 'num_generations_eval': 4, 'max_completion_length': 256, 'ds3_gather_for_generation': True, 'shuffle_dataset': True, 'generation_batch_size': 48, 'steps_per_generation': 3, 'min_p': None, 'generation_kwargs': None, 'chat_template_kwargs': None, 'use_transformers_paged': False, 'cache_implementation': None, 'use_vllm': False, 'vllm_mode': None, 'vllm_model_impl': 'vllm', 'vllm_enable_sleep_mode': False, 'vllm_structured_outputs_regex': None, 'vllm_server_base_url': None, 'vllm_server_host': None, 'vllm_server_port': [8000], 'vllm_server_timeout': 240.0, 'vllm_group_port': 51216, 'vllm_gpu_memory_utilization': 0.9, 'vllm_max_model_length': None, 'vllm_tensor_parallel_size': 1, 'beta': 0.04, 'num_iterations': 2, 'epsilon': 0.2, 'delta': None, 'epsilon_high': 0.28, 'sapo_temperature_neg': 1.05, 'sapo_temperature_pos': 1.0, 'importance_sampling_level': 'token', 'reward_weights': None, 'multi_objective_aggregation': 'sum_then_normalize', 'scale_rewards': 'group', 'loss_type': 'dapo', 'mask_truncated_completions': False, 'sync_ref_model': 
False, 'ref_model_mixup_alpha': 0.6, 'ref_model_sync_steps': 512, 'top_entropy_quantile': 1.0, 'max_tool_calling_iterations': None, 'vllm_importance_sampling_correction': True, 'vllm_importance_sampling_mode': 'sequence_mask', 'vllm_importance_sampling_cap': 3.0, 'off_policy_mask_threshold': None, 'use_bias_correction_kl': False, 'log_completions': True, 'num_completions_to_print': None, 'log_unique_prompts': False, 'log_completions_hub_repo': None, 'tuner_backend': 'peft', 'vit_gradient_checkpointing': True, 'router_aux_loss_coef': 0.0, 'enable_dft_loss': False, 'enable_channel_loss': False, 'safe_serialization': True, 'max_shard_size': '5GB', 'check_model': True, 'acc_strategy': 'token', 'train_dataloader_shuffle': True, 'max_epochs': None, 'aligner_lr': None, 'vit_lr': None, 'use_logits_to_keep': None, 'resume_only_model': False, 'optimizer': None, 'eval_metric': None, 'callbacks': [], 'early_stop_interval': None, 'eval_use_evalscope': False, 'eval_dataset': [], 'eval_dataset_args': None, 'eval_limit': None, 'eval_generation_config': None, 'extra_eval_args': None, 'tuner_type': 'lora', 'use_galore': False, 'galore_target_modules': None, 'galore_rank': 128, 'galore_update_proj_gap': 50, 'galore_scale': 1.0, 'galore_proj_type': 'std', 'galore_optim_per_parameter': False, 'galore_with_embedding': False, 'galore_quantization': False, 'galore_proj_quant': False, 'galore_proj_bits': 4, 'galore_proj_group_size': 256, 'galore_cos_threshold': 0.4, 'galore_gamma_proj': 2, 'galore_queue_size': 5, 'lisa_activated_layers': 0, 'lisa_step_interval': 20, 'use_flash_ckpt': False, 'vllm_pipeline_parallel_size': 1, 'vllm_enable_expert_parallel': False, 'vllm_max_num_seqs': None, 'vllm_max_model_len': None, 'vllm_disable_custom_all_reduce': True, 'vllm_enforce_eager': False, 'vllm_limit_mm_per_prompt': None, 'vllm_max_lora_rank': 16, 'vllm_enable_prefix_caching': True, 'vllm_use_async_engine': None, 'vllm_quantization': None, 'vllm_reasoning_parser': None, 
'vllm_disable_cascade_attn': False, 'vllm_mm_processor_cache_gb': None, 'vllm_speculative_config': None, 'vllm_engine_kwargs': {}, 'vllm_data_parallel_size': 1, 'stop_words': [], 'vllm_enable_lora': False, 'lora_rank': 8, 'vllm_server_group_port': None, 'enable_flattened_weight_sync': True, 'async_generate': False, 'structured_outputs_regex': None, 'sleep_level': 0, 'move_model_batches': None, 'offload_optimizer': False, 'offload_model': False, 'wandb_log_unique_prompts': None, 'cosine_min_len_value_wrong': -0.5, 'cosine_max_len_value_wrong': 0.0, 'cosine_min_len_value_correct': 1.0, 'cosine_max_len_value_correct': 0.5, 'cosine_max_len': 256, 'repetition_n_grams': 3, 'repetition_max_penalty': -1.0, 'reward_model': None, 'reward_model_plugin': None, 'chord_sft_dataset': [], 'chord_sft_per_device_train_batch_size': None, 'chord_enable_phi_function': False, 'chord_mu_warmup_steps': None, 'chord_mu_decay_steps': None, 'chord_mu_peak': None, 'chord_mu_valley': None, 'multi_turn_scheduler': None, 'max_turns': None, 'completion_length_limit_scope': 'per_round', 'vllm_server_pass_dataset': False, 'dynamic_sample': True, 'max_resample_times': 4, 'overlong_filter': True, 'soft_max_length': None, 'soft_cache_length': None, 'log_entropy': False, 'tau_pos': 1.0, 'tau_neg': 1.05, 'advantage_estimator': 'grpo', 'kl_in_reward': False, 'dataset_shuffle': True, 'rollout_importance_sampling_mode': None, 'rollout_importance_sampling_threshold': 2.0, 'log_rollout_offpolicy_metrics': False, 'off_policy_sequence_mask_delta': None}
23
+ 2026-04-17 12:53:51,543 INFO MainThread:255159 [wandb_config.py:__setitem__():154] [no run ID] config set model/num_parameters = 2050307712 - <bound method Run._config_callback of <wandb.sdk.wandb_run.Run object at 0x7fca74e06a70>>
24
+ 2026-04-17 12:53:51,543 INFO MainThread:255159 [wandb_run.py:_config_callback():1385] config_cb model/num_parameters 2050307712 None
25
+ 2026-04-17 13:03:10,120 INFO wandb-AsyncioManager-main:255159 [service_client.py:_forward_responses():80] Reached EOF.
26
+ 2026-04-17 13:03:10,120 INFO wandb-AsyncioManager-main:255159 [mailbox.py:close():137] Closing mailbox, abandoning 1 handles.
wandb/run-20260418_172847-c2a5hfz3/files/config.yaml ADDED
@@ -0,0 +1,1262 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ _name_or_path:
2
+ value: /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/qwen3-asr-merged
3
+ _wandb:
4
+ value:
5
+ cli_version: 0.23.0
6
+ e:
7
+ ess1zs9oqcfvbaak4xbqvnst142xqp1g:
8
+ args:
9
+ - --rlhf_type
10
+ - grpo
11
+ - --external_plugins
12
+ - /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/my_qwen3_asr_dapo_register.py
13
+ - /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/0417_reward.py
14
+ - --model
15
+ - /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/qwen3-asr-merged
16
+ - --model_type
17
+ - my_qwen3_asr_rl
18
+ - --template
19
+ - my_qwen3_asr_rl
20
+ - --dataset
21
+ - /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/lora_0323_10w+55w+error+syn_with_domain_train90_targeted_rl_train90_loramerged_basewer_3suppress_server.jsonl
22
+ - --val_dataset
23
+ - /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/lora_0323_10w+55w+error+syn_with_domain_train90_targeted_rl_val5_sample5p_server.jsonl
24
+ - --reward_funcs
25
+ - asr_wer_sub_len_cmp_hallu_dirty_v56
26
+ - --train_type
27
+ - lora
28
+ - --use_vllm
29
+ - "false"
30
+ - --log_completions
31
+ - "true"
32
+ - --loss_type
33
+ - dapo
34
+ - --advantage_estimator
35
+ - grpo
36
+ - --scale_rewards
37
+ - group
38
+ - --num_iterations
39
+ - "2"
40
+ - --beta
41
+ - "0.04"
42
+ - --epsilon_high
43
+ - "0.28"
44
+ - --dynamic_sample
45
+ - "true"
46
+ - --max_resample_times
47
+ - "4"
48
+ - --overlong_filter
49
+ - "true"
50
+ - --truncation_strategy
51
+ - delete
52
+ - --num_generations
53
+ - "12"
54
+ - --generation_batch_size
55
+ - "48"
56
+ - --per_device_train_batch_size
57
+ - "4"
58
+ - --per_device_eval_batch_size
59
+ - "4"
60
+ - --gradient_accumulation_steps
61
+ - "12"
62
+ - --num_generations_eval
63
+ - "4"
64
+ - --max_completion_length
65
+ - "256"
66
+ - --temperature
67
+ - "0.50"
68
+ - --top_p
69
+ - "0.95"
70
+ - --top_k
71
+ - "50"
72
+ - --repetition_penalty
73
+ - "1.08"
74
+ - --learning_rate
75
+ - "5e-5"
76
+ - --lr_scheduler_type
77
+ - cosine
78
+ - --warmup_ratio
79
+ - "0.03"
80
+ - --report_to
81
+ - wandb
82
+ - --run_name
83
+ - qwen3asr_dapo_reward56_4x4x12_12gen_4GPU
84
+ - --output_dir
85
+ - /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/out/qwen3asr_dapo_reward56_4x4x12_12gen_4GPU
86
+ - --save_strategy
87
+ - steps
88
+ - --save_steps
89
+ - "20"
90
+ - --logging_steps
91
+ - "5"
92
+ - --freeze_llm
93
+ - "false"
94
+ - --freeze_vit
95
+ - "false"
96
+ - --freeze_aligner
97
+ - "false"
98
+ - --remove_unused_columns
99
+ - "false"
100
+ - --padding_side
101
+ - left
102
+ cpu_count: 64
103
+ cpu_count_logical: 128
104
+ cudaVersion: "12.4"
105
+ disk:
106
+ /:
107
+ total: "524945911808"
108
+ used: "37368901632"
109
+ email: pang_kaiyu@163.com
110
+ executable: /mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/bin/python3.10
111
+ gpu: NVIDIA A100-SXM4-80GB
112
+ gpu_count: 8
113
+ gpu_nvidia:
114
+ - architecture: Ampere
115
+ cudaCores: 6912
116
+ memoryTotal: "85899345920"
117
+ name: NVIDIA A100-SXM4-80GB
118
+ uuid: GPU-87e7e3ab-b254-fc22-7407-8e2e88e9d854
119
+ - architecture: Ampere
120
+ cudaCores: 6912
121
+ memoryTotal: "85899345920"
122
+ name: NVIDIA A100-SXM4-80GB
123
+ uuid: GPU-976db8a1-cf00-11c6-caaa-413862233fd4
124
+ - architecture: Ampere
125
+ cudaCores: 6912
126
+ memoryTotal: "85899345920"
127
+ name: NVIDIA A100-SXM4-80GB
128
+ uuid: GPU-78b37ae8-44e0-e318-a6c0-f6f4ac78d46a
129
+ - architecture: Ampere
130
+ cudaCores: 6912
131
+ memoryTotal: "85899345920"
132
+ name: NVIDIA A100-SXM4-80GB
133
+ uuid: GPU-840b937d-a7d4-68e7-ad57-f4568e01c3ae
134
+ - architecture: Ampere
135
+ cudaCores: 6912
136
+ memoryTotal: "85899345920"
137
+ name: NVIDIA A100-SXM4-80GB
138
+ uuid: GPU-a9d0de54-f5b5-f83b-7bda-f53db844622d
139
+ - architecture: Ampere
140
+ cudaCores: 6912
141
+ memoryTotal: "85899345920"
142
+ name: NVIDIA A100-SXM4-80GB
143
+ uuid: GPU-cb7d22e9-305c-c68c-64f1-599580742db0
144
+ - architecture: Ampere
145
+ cudaCores: 6912
146
+ memoryTotal: "85899345920"
147
+ name: NVIDIA A100-SXM4-80GB
148
+ uuid: GPU-8d9704bb-4592-346f-a7f2-1a6ed8d58619
149
+ - architecture: Ampere
150
+ cudaCores: 6912
151
+ memoryTotal: "85899345920"
152
+ name: NVIDIA A100-SXM4-80GB
153
+ uuid: GPU-3892f01b-e0b8-a9d9-0587-b5a7d2d9b5ab
154
+ host: SH-IDC1-10-140-37-95
155
+ memory:
156
+ total: "1081627828224"
157
+ os: Linux-3.10.0-957.el7.x86_64-x86_64-with-glibc2.17
158
+ program: /mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/cli/rlhf.py
159
+ python: CPython 3.10.18
160
+ root: /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload
161
+ slurm:
162
+ cluster_name: cluster_sproject3
163
+ conf: /etc/slurm/slurm.conf
164
+ cpus_on_node: "2"
165
+ gtids: "0"
166
+ job_account: research
167
+ job_cpus_per_node: "2"
168
+ job_gid: "800000689"
169
+ job_gpus: 0,1,2,6
170
+ job_id: "8574598"
171
+ job_name: qwen3_asr_train_4gpu
172
+ job_nodelist: SH-IDC1-10-140-37-95
173
+ job_num_nodes: "1"
174
+ job_partition: interntmp
175
+ job_qos: normal
176
+ job_uid: "800000689"
177
+ job_user: panjiabao
178
+ jobid: "8574598"
179
+ localid: "0"
180
+ nnodes: "1"
181
+ node_aliases: (null)
182
+ nodeid: "0"
183
+ nodelist: SH-IDC1-10-140-37-95
184
+ nprocs: "1"
185
+ ntasks: "1"
186
+ prio_process: "0"
187
+ procid: "0"
188
+ submit_dir: /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload
189
+ submit_host: SH-IDC1-10-140-37-164
190
+ task_pid: "9466"
191
+ tasks_per_node: "1"
192
+ topology_addr: SH-IDC1-10-140-37-95
193
+ topology_addr_pattern: node
194
+ working_cluster: cluster_sproject3:SH-IDC1-10-140-37-161:6817:9216:109
195
+ startedAt: "2026-04-18T09:28:47.432340Z"
196
+ writerId: ess1zs9oqcfvbaak4xbqvnst142xqp1g
197
+ m:
198
+ - "1": train/global_step
199
+ "6":
200
+ - 3
201
+ "7": []
202
+ - "2": '*'
203
+ "5": 1
204
+ "6":
205
+ - 1
206
+ "7": []
207
+ python_version: 3.10.18
208
+ t:
209
+ "1":
210
+ - 1
211
+ - 5
212
+ - 11
213
+ - 30
214
+ - 41
215
+ - 49
216
+ - 51
217
+ - 53
218
+ - 71
219
+ - 84
220
+ - 95
221
+ - 98
222
+ - 105
223
+ "2":
224
+ - 1
225
+ - 5
226
+ - 11
227
+ - 30
228
+ - 41
229
+ - 49
230
+ - 51
231
+ - 53
232
+ - 71
233
+ - 84
234
+ - 95
235
+ - 98
236
+ - 105
237
+ "3":
238
+ - 7
239
+ - 13
240
+ - 19
241
+ - 66
242
+ "4": 3.10.18
243
+ "5": 0.23.0
244
+ "6": 4.57.6
245
+ "9":
246
+ "1": transformers_trainer
247
+ "12": 0.23.0
248
+ "13": linux-x86_64
249
+ acc_strategy:
250
+ value: token
251
+ accelerator_config:
252
+ value:
253
+ dispatch_batches: false
254
+ even_batches: true
255
+ gradient_accumulation_kwargs: null
256
+ non_blocking: false
257
+ split_batches: false
258
+ use_seedable_sampler: true
259
+ adafactor:
260
+ value: false
261
+ adam_beta1:
262
+ value: 0.9
263
+ adam_beta2:
264
+ value: 0.95
265
+ adam_epsilon:
266
+ value: 1e-08
267
+ add_cross_attention:
268
+ value: false
269
+ advantage_estimator:
270
+ value: grpo
271
+ aligner_lr:
272
+ value: null
273
+ architectures:
274
+ value:
275
+ - Qwen3ASRForConditionalGeneration
276
+ async_generate:
277
+ value: false
278
+ auto_find_batch_size:
279
+ value: false
280
+ average_tokens_across_devices:
281
+ value: true
282
+ bad_words_ids:
283
+ value: null
284
+ batch_eval_metrics:
285
+ value: false
286
+ begin_suppress_tokens:
287
+ value: null
288
+ beta:
289
+ value: 0.04
290
+ bf16:
291
+ value: true
292
+ bf16_full_eval:
293
+ value: false
294
+ bos_token_id:
295
+ value: null
296
+ cache_implementation:
297
+ value: null
298
+ callbacks:
299
+ value: []
300
+ cast_lm_head_to_fp32:
301
+ value: false
302
+ chat_template_kwargs:
303
+ value: null
304
+ check_model:
305
+ value: true
306
+ chord_enable_phi_function:
307
+ value: false
308
+ chord_mu_decay_steps:
309
+ value: null
310
+ chord_mu_peak:
311
+ value: null
312
+ chord_mu_valley:
313
+ value: null
314
+ chord_mu_warmup_steps:
315
+ value: null
316
+ chord_sft_dataset:
317
+ value: []
318
+ chord_sft_per_device_train_batch_size:
319
+ value: null
320
+ chunk_size_feed_forward:
321
+ value: 0
322
+ completion_length_limit_scope:
323
+ value: per_round
324
+ cosine_max_len:
325
+ value: 256
326
+ cosine_max_len_value_correct:
327
+ value: 0.5
328
+ cosine_max_len_value_wrong:
329
+ value: 0
330
+ cosine_min_len_value_correct:
331
+ value: 1
332
+ cosine_min_len_value_wrong:
333
+ value: -0.5
334
+ cross_attention_hidden_size:
335
+ value: null
336
+ data_seed:
337
+ value: 42
338
+ dataloader_drop_last:
339
+ value: true
340
+ dataloader_num_workers:
341
+ value: 1
342
+ dataloader_persistent_workers:
343
+ value: false
344
+ dataloader_pin_memory:
345
+ value: true
346
+ dataloader_prefetch_factor:
347
+ value: 2
348
+ dataset_shuffle:
349
+ value: true
350
+ ddp_backend:
351
+ value: null
352
+ ddp_broadcast_buffers:
353
+ value: null
354
+ ddp_bucket_cap_mb:
355
+ value: null
356
+ ddp_find_unused_parameters:
357
+ value: null
358
+ ddp_timeout:
359
+ value: 18000000
360
+ debug:
361
+ value: []
362
+ decoder_start_token_id:
363
+ value: null
364
+ deepspeed:
365
+ value: null
366
+ delta:
367
+ value: null
368
+ disable_dropout:
369
+ value: false
370
+ disable_tqdm:
371
+ value: false
372
+ diversity_penalty:
373
+ value: 0
374
+ do_eval:
375
+ value: true
376
+ do_predict:
377
+ value: false
378
+ do_sample:
379
+ value: false
380
+ do_train:
381
+ value: false
382
+ ds3_gather_for_generation:
383
+ value: true
384
+ dtype:
385
+ value: bfloat16
386
+ dynamic_sample:
387
+ value: true
388
+ early_stop_interval:
389
+ value: null
390
+ early_stopping:
391
+ value: false
392
+ enable_channel_loss:
393
+ value: false
394
+ enable_dft_loss:
395
+ value: false
396
+ enable_flattened_weight_sync:
397
+ value: true
398
+ encoder_no_repeat_ngram_size:
399
+ value: 0
400
+ eos_token_id:
401
+ value: 151645
402
+ epsilon:
403
+ value: 0.2
404
+ epsilon_high:
405
+ value: 0.28
406
+ eval_accumulation_steps:
407
+ value: null
408
+ eval_dataset:
409
+ value: []
410
+ eval_dataset_args:
411
+ value: null
412
+ eval_delay:
413
+ value: 0
414
+ eval_do_concat_batches:
415
+ value: true
416
+ eval_generation_config:
417
+ value: null
418
+ eval_limit:
419
+ value: null
420
+ eval_metric:
421
+ value: null
422
+ eval_on_start:
423
+ value: false
424
+ eval_steps:
425
+ value: 20
426
+ eval_strategy:
427
+ value: steps
428
+ eval_use_evalscope:
429
+ value: false
430
+ eval_use_gather_object:
431
+ value: false
432
+ exponential_decay_length_penalty:
433
+ value: null
434
+ extra_eval_args:
435
+ value: null
436
+ finetuning_task:
437
+ value: null
438
+ forced_bos_token_id:
439
+ value: null
440
+ forced_eos_token_id:
441
+ value: null
442
+ fp16:
443
+ value: false
444
+ fp16_backend:
445
+ value: auto
446
+ fp16_full_eval:
447
+ value: false
448
+ fp16_opt_level:
449
+ value: O1
450
+ fsdp:
451
+ value: []
452
+ fsdp_config:
453
+ value:
454
+ min_num_params: 0
455
+ xla: false
456
+ xla_fsdp_grad_ckpt: false
457
+ xla_fsdp_v2: false
458
+ fsdp_min_num_params:
459
+ value: 0
460
+ fsdp_transformer_layer_cls_to_wrap:
461
+ value: null
462
+ full_determinism:
463
+ value: false
464
+ galore_cos_threshold:
465
+ value: 0.4
466
+ galore_gamma_proj:
467
+ value: 2
468
+ galore_optim_per_parameter:
469
+ value: false
470
+ galore_proj_bits:
471
+ value: 4
472
+ galore_proj_group_size:
473
+ value: 256
474
+ galore_proj_quant:
475
+ value: false
476
+ galore_proj_type:
477
+ value: std
478
+ galore_quantization:
479
+ value: false
480
+ galore_queue_size:
481
+ value: 5
482
+ galore_rank:
483
+ value: 128
484
+ galore_scale:
485
+ value: 1
486
+ galore_target_modules:
487
+ value: null
488
+ galore_update_proj_gap:
489
+ value: 50
490
+ galore_with_embedding:
491
+ value: false
492
+ generation_batch_size:
493
+ value: 48
494
+ generation_kwargs:
495
+ value: null
496
+ gradient_accumulation_steps:
497
+ value: 12
498
+ gradient_checkpointing:
499
+ value: false
500
+ gradient_checkpointing_kwargs:
501
+ value: null
502
+ greater_is_better:
503
+ value: false
504
+ group_by_length:
505
+ value: false
506
+ half_precision_backend:
507
+ value: auto
508
+ hub_always_push:
509
+ value: false
510
+ hub_model_id:
511
+ value: null
512
+ hub_private_repo:
513
+ value: null
514
+ hub_revision:
515
+ value: null
516
+ hub_strategy:
517
+ value: every_save
518
+ hub_token:
519
+ value: <HUB_TOKEN>
520
+ id2label:
521
+ value:
522
+ "0": LABEL_0
523
+ "1": LABEL_1
524
+ ignore_data_skip:
525
+ value: false
526
+ importance_sampling_level:
527
+ value: token
528
+ include_for_metrics:
529
+ value: []
530
+ include_inputs_for_metrics:
531
+ value: false
532
+ include_num_input_tokens_seen:
533
+ value: "no"
534
+ include_tokens_per_second:
535
+ value: false
536
+ is_decoder:
537
+ value: false
538
+ is_encoder_decoder:
539
+ value: false
540
+ jit_mode_eval:
541
+ value: false
542
+ kl_in_reward:
543
+ value: false
544
+ label_names:
545
+ value: null
546
+ label_smoothing_factor:
547
+ value: 0
548
+ label2id:
549
+ value:
550
+ LABEL_0: 0
551
+ LABEL_1: 1
552
+ learning_rate:
553
+ value: 5e-05
554
+ length_column_name:
555
+ value: length
556
+ length_penalty:
557
+ value: 1
558
+ liger_kernel_config:
559
+ value: null
560
+ lisa_activated_layers:
561
+ value: 0
562
+ lisa_step_interval:
563
+ value: 20
564
+ load_best_model_at_end:
565
+ value: false
566
+ local_rank:
567
+ value: 0
568
+ log_completions:
569
+ value: true
570
+ log_completions_hub_repo:
571
+ value: null
572
+ log_entropy:
573
+ value: false
574
+ log_level:
575
+ value: passive
576
+ log_level_replica:
577
+ value: warning
578
+ log_on_each_node:
579
+ value: true
580
+ log_rollout_offpolicy_metrics:
581
+ value: false
582
+ log_unique_prompts:
583
+ value: false
584
+ logging_dir:
585
+ value: /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/out/qwen3asr_dapo_reward56_4x4x12_12gen_4GPU/v5-20260418-172837/runs
586
+ logging_first_step:
587
+ value: true
588
+ logging_nan_inf_filter:
589
+ value: true
590
+ logging_steps:
591
+ value: 5
592
+ logging_strategy:
593
+ value: steps
594
+ lora_rank:
595
+ value: 8
596
+ loss_type:
597
+ value: dapo
598
+ lr_scheduler_kwargs:
599
+ value: null
600
+ lr_scheduler_type:
601
+ value: cosine
602
+ mask_truncated_completions:
603
+ value: false
604
+ max_completion_length:
605
+ value: 256
606
+ max_epochs:
607
+ value: null
608
+ max_grad_norm:
609
+ value: 1
610
+ max_length:
611
+ value: 20
612
+ max_resample_times:
613
+ value: 4
614
+ max_shard_size:
615
+ value: 5GB
616
+ max_steps:
617
+ value: -1
618
+ max_tool_calling_iterations:
619
+ value: null
620
+ max_turns:
621
+ value: null
622
+ metric_for_best_model:
623
+ value: loss
624
+ min_length:
625
+ value: 0
626
+ min_p:
627
+ value: null
628
+ model/num_parameters:
629
+ value: 2050307712
630
+ model_init_kwargs:
631
+ value: null
632
+ model_type:
633
+ value: qwen3_asr
634
+ move_model_batches:
635
+ value: null
636
+ mp_parameters:
637
+ value: ""
638
+ multi_objective_aggregation:
639
+ value: sum_then_normalize
640
+ multi_turn_scheduler:
641
+ value: null
642
+ neftune_noise_alpha:
643
+ value: null
644
+ no_cuda:
645
+ value: false
646
+ no_repeat_ngram_size:
647
+ value: 0
648
+ num_beam_groups:
649
+ value: 1
650
+ num_beams:
651
+ value: 1
652
+ num_completions_to_print:
653
+ value: null
654
+ num_generations:
655
+ value: 12
656
+ num_generations_eval:
657
+ value: 4
658
+ num_iterations:
659
+ value: 2
660
+ num_return_sequences:
661
+ value: 1
662
+ num_train_epochs:
663
+ value: 3
664
+ off_policy_mask_threshold:
665
+ value: null
666
+ off_policy_sequence_mask_delta:
667
+ value: null
668
+ offload_model:
669
+ value: false
670
+ offload_optimizer:
671
+ value: false
672
+ optim:
673
+ value: adamw_torch
674
+ optim_args:
675
+ value: null
676
+ optim_target_modules:
677
+ value: null
678
+ optimizer:
679
+ value: null
680
+ output_attentions:
681
+ value: false
682
+ output_dir:
683
+ value: /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/out/qwen3asr_dapo_reward56_4x4x12_12gen_4GPU/v5-20260418-172837
684
+ output_hidden_states:
685
+ value: false
686
+ output_scores:
687
+ value: false
688
+ overlong_filter:
689
+ value: true
690
+ overwrite_output_dir:
691
+ value: false
692
+ pad_token_id:
693
+ value: 151643
694
+ parallelism_config:
695
+ value: null
696
+ past_index:
697
+ value: -1
698
+ peft_config:
699
+ value:
700
+ default:
701
+ alora_invocation_tokens: null
702
+ arrow_config: null
703
+ auto_mapping: null
704
+ base_model_name_or_path: /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/qwen3-asr-merged
705
+ bias: none
706
+ corda_config: null
707
+ ensure_weight_tying: false
708
+ eva_config: null
709
+ exclude_modules: null
710
+ fan_in_fan_out: false
711
+ inference_mode: false
712
+ init_lora_weights: true
713
+ layer_replication: null
714
+ layers_pattern: null
715
+ layers_to_transform: null
716
+ lora_alpha: 32
717
+ lora_bias: false
718
+ lora_dropout: 0.05
719
+ lora_dtype: null
720
+ lorap_emb_lr: 1e-06
721
+ lorap_lr_ratio: null
722
+ megatron_config: null
723
+ megatron_core: megatron.core
724
+ modules_to_save: []
725
+ peft_type: LORA
726
+ peft_version: 0.18.1
727
+ qalora_group_size: 16
728
+ r: 8
729
+ revision: null
730
+ runtime_config:
731
+ ephemeral_gpu_offload: false
732
+ target_modules: ^(thinker\.model(?=\.).*\.(up_proj|q_proj|o_proj|gate_proj|k_proj|v_proj|down_proj)|thinker\.audio_tower\.layers(?=\.).*\.(q_proj|fc1|out_proj|k_proj|v_proj|fc2)|thinker\.audio_tower\.conv_out(?=\.)|thinker\.audio_tower\.proj1(?=\.)|thinker\.audio_tower\.proj2(?=\.))$
733
+ target_parameters: null
734
+ task_type: CAUSAL_LM
735
+ trainable_token_indices: null
736
+ use_dora: false
737
+ use_qalora: false
738
+ use_rslora: false
739
+ per_device_eval_batch_size:
740
+ value: 4
741
+ per_device_train_batch_size:
742
+ value: 4
743
+ per_gpu_eval_batch_size:
744
+ value: null
745
+ per_gpu_train_batch_size:
746
+ value: null
747
+ prediction_loss_only:
748
+ value: false
749
+ prefix:
750
+ value: null
751
+ problem_type:
752
+ value: null
753
+ project:
754
+ value: huggingface
755
+ push_to_hub:
756
+ value: false
757
+ push_to_hub_model_id:
758
+ value: null
759
+ push_to_hub_organization:
760
+ value: null
761
+ push_to_hub_token:
762
+ value: <PUSH_TO_HUB_TOKEN>
763
+ ray_scope:
764
+ value: last
765
+ ref_model_mixup_alpha:
766
+ value: 0.6
767
+ ref_model_sync_steps:
768
+ value: 512
769
+ remove_invalid_values:
770
+ value: false
771
+ remove_unused_columns:
772
+ value: false
773
+ repetition_max_penalty:
774
+ value: -1
775
+ repetition_n_grams:
776
+ value: 3
777
+ repetition_penalty:
778
+ value: 1.08
779
+ report_to:
780
+ value:
781
+ - wandb
782
+ restore_callback_states_from_checkpoint:
783
+ value: false
784
+ resume_from_checkpoint:
785
+ value: null
786
+ resume_only_model:
787
+ value: false
788
+ return_dict:
789
+ value: true
790
+ return_dict_in_generate:
791
+ value: false
792
+ reward_model:
793
+ value: null
794
+ reward_model_plugin:
795
+ value: null
796
+ reward_weights:
797
+ value: null
798
+ rollout_importance_sampling_mode:
799
+ value: null
800
+ rollout_importance_sampling_threshold:
801
+ value: 2
802
+ router_aux_loss_coef:
803
+ value: 0
804
+ run_name:
805
+ value: qwen3asr_dapo_reward56_4x4x12_12gen_4GPU
806
+ safe_serialization:
807
+ value: true
808
+ sapo_temperature_neg:
809
+ value: 1.05
810
+ sapo_temperature_pos:
811
+ value: 1
812
+ save_on_each_node:
813
+ value: false
814
+ save_only_model:
815
+ value: false
816
+ save_safetensors:
817
+ value: true
818
+ save_steps:
819
+ value: 20
820
+ save_strategy:
821
+ value: steps
822
+ save_total_limit:
823
+ value: null
824
+ scale_rewards:
825
+ value: group
826
+ seed:
827
+ value: 42
828
+ sep_token_id:
829
+ value: null
830
+ shuffle_dataset:
831
+ value: true
832
+ skip_memory_metrics:
833
+ value: true
834
+ sleep_level:
835
+ value: 0
836
+ soft_cache_length:
837
+ value: null
838
+ soft_max_length:
839
+ value: null
840
+ steps_per_generation:
841
+ value: 3
842
+ stop_words:
843
+ value: []
844
+ structured_outputs_regex:
845
+ value: null
846
+ support_languages:
847
+ value:
848
+ - Chinese
849
+ - English
850
+ - Cantonese
851
+ - Arabic
852
+ - German
853
+ - French
854
+ - Spanish
855
+ - Portuguese
856
+ - Indonesian
857
+ - Italian
858
+ - Korean
859
+ - Russian
860
+ - Thai
861
+ - Vietnamese
862
+ - Japanese
863
+ - Turkish
864
+ - Hindi
865
+ - Malay
866
+ - Dutch
867
+ - Swedish
868
+ - Danish
869
+ - Finnish
870
+ - Polish
871
+ - Czech
872
+ - Filipino
873
+ - Persian
874
+ - Greek
875
+ - Romanian
876
+ - Hungarian
877
+ - Macedonian
878
+ suppress_tokens:
879
+ value: null
880
+ sync_ref_model:
881
+ value: false
882
+ task_specific_params:
883
+ value: null
884
+ tau_neg:
885
+ value: 1.05
886
+ tau_pos:
887
+ value: 1
888
+ temperature:
889
+ value: 0.5
890
+ tf_legacy_loss:
891
+ value: false
892
+ tf32:
893
+ value: null
894
+ thinker_config:
895
+ value:
896
+ _name_or_path: ""
897
+ add_cross_attention: false
898
+ architectures:
899
+ - Qwen3ASRForConditionalGeneration
900
+ audio_config:
901
+ _name_or_path: ""
902
+ activation_dropout: 0
903
+ activation_function: gelu
904
+ add_cross_attention: false
905
+ architectures: null
906
+ attention_dropout: 0
907
+ bad_words_ids: null
908
+ begin_suppress_tokens: null
909
+ bos_token_id: null
910
+ chunk_size_feed_forward: 0
911
+ conv_chunksize: 500
912
+ cross_attention_hidden_size: null
913
+ d_model: 1024
914
+ decoder_start_token_id: null
915
+ diversity_penalty: 0
916
+ do_sample: false
917
+ downsample_hidden_size: 480
918
+ dropout: 0
919
+ dtype: null
920
+ early_stopping: false
921
+ encoder_attention_heads: 16
922
+ encoder_ffn_dim: 4096
923
+ encoder_layers: 24
924
+ encoder_no_repeat_ngram_size: 0
925
+ eos_token_id: null
926
+ exponential_decay_length_penalty: null
927
+ finetuning_task: null
928
+ forced_bos_token_id: null
929
+ forced_eos_token_id: null
930
+ id2label:
931
+ "0": LABEL_0
932
+ "1": LABEL_1
933
+ initializer_range: 0.02
934
+ is_decoder: false
935
+ is_encoder_decoder: false
936
+ label2id:
937
+ LABEL_0: 0
938
+ LABEL_1: 1
939
+ length_penalty: 1
940
+ max_length: 20
941
+ max_source_positions: 1500
942
+ min_length: 0
943
+ model_type: qwen3_asr_audio_encoder
944
+ n_window: 50
945
+ n_window_infer: 800
946
+ no_repeat_ngram_size: 0
947
+ num_beam_groups: 1
948
+ num_beams: 1
949
+ num_hidden_layers: 24
950
+ num_mel_bins: 128
951
+ num_return_sequences: 1
952
+ output_attentions: false
953
+ output_dim: 2048
954
+ output_hidden_states: false
955
+ output_scores: false
956
+ pad_token_id: null
957
+ prefix: null
958
+ problem_type: null
959
+ remove_invalid_values: false
960
+ repetition_penalty: 1
961
+ return_dict: true
962
+ return_dict_in_generate: false
963
+ scale_embedding: false
964
+ sep_token_id: null
965
+ suppress_tokens: null
966
+ task_specific_params: null
967
+ temperature: 1
968
+ tf_legacy_loss: false
969
+ tie_encoder_decoder: false
970
+ tie_word_embeddings: true
971
+ tokenizer_class: null
972
+ top_k: 50
973
+ top_p: 1
974
+ torchscript: false
975
+ typical_p: 1
976
+ use_bfloat16: false
977
+ audio_end_token_id: 151670
978
+ audio_start_token_id: 151669
979
+ audio_token_id: 151676
980
+ bad_words_ids: null
981
+ begin_suppress_tokens: null
982
+ bos_token_id: null
983
+ chunk_size_feed_forward: 0
984
+ cross_attention_hidden_size: null
985
+ decoder_start_token_id: null
986
+ diversity_penalty: 0
987
+ do_sample: false
988
+ dtype: bfloat16
989
+ early_stopping: false
990
+ encoder_no_repeat_ngram_size: 0
991
+ eos_token_id: null
992
+ exponential_decay_length_penalty: null
993
+ finetuning_task: null
994
+ forced_bos_token_id: null
995
+ forced_eos_token_id: null
996
+ id2label:
997
+ "0": LABEL_0
998
+ "1": LABEL_1
999
+ initializer_range: 0.02
1000
+ is_decoder: false
1001
+ is_encoder_decoder: false
1002
+ label2id:
1003
+ LABEL_0: 0
1004
+ LABEL_1: 1
1005
+ length_penalty: 1
1006
+ max_length: 20
1007
+ min_length: 0
1008
+ model_type: qwen3_asr_thinker
1009
+ no_repeat_ngram_size: 0
1010
+ num_beam_groups: 1
1011
+ num_beams: 1
1012
+ num_return_sequences: 1
1013
+ output_attentions: false
1014
+ output_hidden_states: false
1015
+ output_scores: false
1016
+ pad_token_id: null
1017
+ prefix: null
1018
+ problem_type: null
1019
+ remove_invalid_values: false
1020
+ repetition_penalty: 1
1021
+ return_dict: true
1022
+ return_dict_in_generate: false
1023
+ sep_token_id: null
1024
+ suppress_tokens: null
1025
+ task_specific_params: null
1026
+ temperature: 1
1027
+ text_config:
1028
+ _name_or_path: ""
1029
+ add_cross_attention: false
1030
+ architectures: null
1031
+ attention_bias: false
1032
+ attention_dropout: 0
1033
+ bad_words_ids: null
1034
+ begin_suppress_tokens: null
1035
+ bos_token_id: null
1036
+ chunk_size_feed_forward: 0
1037
+ cross_attention_hidden_size: null
1038
+ decoder_start_token_id: null
1039
+ diversity_penalty: 0
1040
+ do_sample: false
1041
+ dtype: null
1042
+ early_stopping: false
1043
+ encoder_no_repeat_ngram_size: 0
1044
+ eos_token_id: null
1045
+ exponential_decay_length_penalty: null
1046
+ finetuning_task: null
1047
+ forced_bos_token_id: null
1048
+ forced_eos_token_id: null
1049
+ head_dim: 128
1050
+ hidden_act: silu
1051
+ hidden_size: 2048
1052
+ id2label:
1053
+ "0": LABEL_0
1054
+ "1": LABEL_1
1055
+ initializer_range: 0.02
1056
+ intermediate_size: 6144
1057
+ is_decoder: false
1058
+ is_encoder_decoder: false
1059
+ label2id:
1060
+ LABEL_0: 0
1061
+ LABEL_1: 1
1062
+ length_penalty: 1
1063
+ max_length: 20
1064
+ max_position_embeddings: 65536
1065
+ min_length: 0
1066
+ model_type: qwen3_asr_text
1067
+ no_repeat_ngram_size: 0
1068
+ num_attention_heads: 16
1069
+ num_beam_groups: 1
1070
+ num_beams: 1
1071
+ num_hidden_layers: 28
1072
+ num_key_value_heads: 8
1073
+ num_return_sequences: 1
1074
+ output_attentions: false
1075
+ output_hidden_states: false
1076
+ output_scores: false
1077
+ pad_token_id: 151643
1078
+ prefix: null
1079
+ problem_type: null
1080
+ remove_invalid_values: false
1081
+ repetition_penalty: 1
1082
+ return_dict: true
1083
+ return_dict_in_generate: false
1084
+ rms_norm_eps: 1e-06
1085
+ rope_scaling:
1086
+ interleaved: true
1087
+ mrope_interleaved: true
1088
+ mrope_section:
1089
+ - 24
1090
+ - 20
1091
+ - 20
1092
+ rope_type: default
1093
+ type: default
1094
+ rope_theta: 1000000
1095
+ sep_token_id: null
1096
+ suppress_tokens: null
1097
+ task_specific_params: null
1098
+ temperature: 1
1099
+ tf_legacy_loss: false
1100
+ tie_encoder_decoder: false
1101
+ tie_word_embeddings: true
1102
+ tokenizer_class: null
1103
+ top_k: 50
1104
+ top_p: 1
1105
+ torchscript: false
1106
+ typical_p: 1
1107
+ use_bfloat16: false
1108
+ use_cache: false
1109
+ vocab_size: 151936
1110
+ tf_legacy_loss: false
1111
+ tie_encoder_decoder: false
1112
+ tie_word_embeddings: true
1113
+ tokenizer_class: null
1114
+ top_k: 50
1115
+ top_p: 1
1116
+ torchscript: false
1117
+ typical_p: 1
1118
+ use_bfloat16: false
1119
+ user_token_id: 872
1120
+ tie_encoder_decoder:
1121
+ value: false
1122
+ tie_word_embeddings:
1123
+ value: true
1124
+ tokenizer_class:
1125
+ value: null
1126
+ top_entropy_quantile:
1127
+ value: 1
1128
+ top_k:
1129
+ value: 50
1130
+ top_p:
1131
+ value: 0.95
1132
+ torch_compile:
1133
+ value: false
1134
+ torch_compile_backend:
1135
+ value: null
1136
+ torch_compile_mode:
1137
+ value: null
1138
+ torch_empty_cache_steps:
1139
+ value: null
1140
+ torchdynamo:
1141
+ value: null
1142
+ torchscript:
1143
+ value: false
1144
+ tpu_metrics_debug:
1145
+ value: false
1146
+ tpu_num_cores:
1147
+ value: null
1148
+ trackio_space_id:
1149
+ value: trackio
1150
+ train_dataloader_shuffle:
1151
+ value: true
1152
+ transformers_version:
1153
+ value: 4.57.6
1154
+ tuner_backend:
1155
+ value: peft
1156
+ tuner_type:
1157
+ value: lora
1158
+ typical_p:
1159
+ value: 1
1160
+ use_bfloat16:
1161
+ value: false
1162
+ use_bias_correction_kl:
1163
+ value: false
1164
+ use_cpu:
1165
+ value: false
1166
+ use_flash_ckpt:
1167
+ value: false
1168
+ use_galore:
1169
+ value: false
1170
+ use_legacy_prediction_loop:
1171
+ value: false
1172
+ use_liger_kernel:
1173
+ value: false
1174
+ use_logits_to_keep:
1175
+ value: null
1176
+ use_mps_device:
1177
+ value: false
1178
+ use_transformers_paged:
1179
+ value: false
1180
+ use_vllm:
1181
+ value: false
1182
+ vit_gradient_checkpointing:
1183
+ value: true
1184
+ vit_lr:
1185
+ value: null
1186
+ vllm_data_parallel_size:
1187
+ value: 1
1188
+ vllm_disable_cascade_attn:
1189
+ value: false
1190
+ vllm_disable_custom_all_reduce:
1191
+ value: true
1192
+ vllm_enable_expert_parallel:
1193
+ value: false
1194
+ vllm_enable_lora:
1195
+ value: false
1196
+ vllm_enable_prefix_caching:
1197
+ value: true
1198
+ vllm_enable_sleep_mode:
1199
+ value: false
1200
+ vllm_enforce_eager:
1201
+ value: false
1202
+ vllm_gpu_memory_utilization:
1203
+ value: 0.9
1204
+ vllm_group_port:
1205
+ value: 51216
1206
+ vllm_importance_sampling_cap:
1207
+ value: 3
1208
+ vllm_importance_sampling_correction:
1209
+ value: true
1210
+ vllm_importance_sampling_mode:
1211
+ value: sequence_mask
1212
+ vllm_limit_mm_per_prompt:
1213
+ value: null
1214
+ vllm_max_lora_rank:
1215
+ value: 16
1216
+ vllm_max_model_len:
1217
+ value: null
1218
+ vllm_max_model_length:
1219
+ value: null
1220
+ vllm_max_num_seqs:
1221
+ value: null
1222
+ vllm_mm_processor_cache_gb:
1223
+ value: null
1224
+ vllm_mode:
1225
+ value: null
1226
+ vllm_model_impl:
1227
+ value: vllm
1228
+ vllm_pipeline_parallel_size:
1229
+ value: 1
1230
+ vllm_quantization:
1231
+ value: null
1232
+ vllm_reasoning_parser:
1233
+ value: null
1234
+ vllm_server_base_url:
1235
+ value: null
1236
+ vllm_server_group_port:
1237
+ value: null
1238
+ vllm_server_host:
1239
+ value: null
1240
+ vllm_server_pass_dataset:
1241
+ value: false
1242
+ vllm_server_port:
1243
+ value:
1244
+ - 8000
1245
+ vllm_server_timeout:
1246
+ value: 240
1247
+ vllm_speculative_config:
1248
+ value: null
1249
+ vllm_structured_outputs_regex:
1250
+ value: null
1251
+ vllm_tensor_parallel_size:
1252
+ value: 1
1253
+ vllm_use_async_engine:
1254
+ value: null
1255
+ wandb_log_unique_prompts:
1256
+ value: null
1257
+ warmup_ratio:
1258
+ value: 0.03
1259
+ warmup_steps:
1260
+ value: 0
1261
+ weight_decay:
1262
+ value: 0.1
wandb/run-20260418_172847-c2a5hfz3/files/media/table/completions_291_2ce0194cf48cadccd2a9.table.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"columns": ["step", "prompt", "completion", "ASRWerSubLenCmpHalluDirtyV56", "advantages", "solution"], "data": [["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Captain markham, it's about about my wife. Polly answered, casting down her eyes and returning a very red. The other day, the whistle.<|im_end|>", 0.1822807341814041, -0.8288241028785706, "Captain marker, it's about about my wife. Crawley answered, casting down his eyes and turning very red. The other gave a whistle."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Captain marten, it's about about my wife. Crawley answered, casting down his eyes and returning very red. The other gave a whistle.<|im_end|>", 0.7842410206794739, 1.4543499946594238, "Captain marker, it's about about my wife. Crawley answered, casting down his eyes and turning very red. The other gave a whistle."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Captain knocker, it's about about my wife. Crawley answered, casting down his eyes and returning a very red the other day, the whistle.<|im_end|>", 0.31845957040786743, -0.31231164932250977, "Captain marker, it's about about my wife. Crawley answered, casting down his eyes and turning very red. The other gave a whistle."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Captain Markham, it's about about my wife, Crawley answered, casting down his eyes and returning a very red. The other day, the whistle.<|im_end|>", 0.3182216286659241, -0.31321415305137634, "Captain marker, it's about about my wife. Crawley answered, casting down his eyes and turning very red. 
The other gave a whistle."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At evening upon the world, while others hint that knowledge of these might undo our civilization. There watched him ceaselessly from the under pits those eyes whose duty it is from further within and deeper.<|im_end|>", 0.8666909337043762, 0.20433472096920013, "At evening upon the world, while others hint that knowledge of these might undo our civilization, there watched him ceaselessly from the under pits, those eyes whose duty it is from further within and deeper."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At evening upon the world, while others hint that knowledge of these might undo our civilization, there watched him ceaselessly from the underpits those eyes whose duty it is, from further within and deeper.<|im_end|>", 0.8165187239646912, -0.6340823769569397, "At evening upon the world, while others hint that knowledge of these might undo our civilization, there watched him ceaselessly from the under pits, those eyes whose duty it is from further within and deeper."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At evening upon the world, while others hint that knowledge of these might undo our civilization, there watched him ceaselessly from the under pits those eyes whose duty it is from further within and deeper.<|im_end|>", 0.9336058497428894, 1.3225356340408325, "At evening upon the world, while others hint that knowledge of these might undo our civilization, there watched him ceaselessly from the under pits, those eyes whose duty it is from further within and deeper."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At evening upon the world, while others hint that 
knowledge of these might undo our civilization. There watched him ceaselessly from the under pits those eyes whose duty it is, from further within and deeper.<|im_end|>", 0.8010374307632446, -0.8927869200706482, "At evening upon the world, while others hint that knowledge of these might undo our civilization, there watched him ceaselessly from the under pits, those eyes whose duty it is from further within and deeper."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Milly steered her magnificent way like some great liner cleaving among the canoes of howling savages. Our goddess of grub was built on lines so majestic that they could be followed only with awe.<|im_end|>", 1.0, 0.0, "Milly steered her magnificent way like some great liner cleaving among the canoes of howling savages. Our goddess of grub was built on lines so majestic that they could be followed only with awe."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Milly steered her magnificent way like some great liner cleaving among the canoes of howling savages. Our goddess of grub was built on lines so majestic that they could be followed only with awe.<|im_end|>", 1.0, 0.0, "Milly steered her magnificent way like some great liner cleaving among the canoes of howling savages. Our goddess of grub was built on lines so majestic that they could be followed only with awe."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Milly steered her magnificent way like some great liner cleaving among the canoes of howling savages. Our goddess of grub was built on lines so majestic that they could be followed only with awe.<|im_end|>", 1.0, 0.0, "Milly steered her magnificent way like some great liner cleaving among the canoes of howling savages. 
Our goddess of grub was built on lines so majestic that they could be followed only with awe."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Milly steered her magnificent way like some great liner cleaving among the canoes of howling savages. Our goddess of grub was built on lines so majestic that they could be followed only with awe.<|im_end|>", 1.0, 0.0, "Milly steered her magnificent way like some great liner cleaving among the canoes of howling savages. Our goddess of grub was built on lines so majestic that they could be followed only with awe."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And made properly lavish time out of working time. It is not improbable that glossy buttons are a valid feature in the garb of a humdrum and harassed hospital porter. Many intellect.<|im_end|>", 0.11065644025802612, 0.8317853212356567, "And may properly lavish time and trouble thereupon. It is not arguable that glossy buttons are a valid feature of the garb of a humdrum and harassed hospital, orderly many a time."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And may properly lavish time and sport in a pantomime. It is not improbable that glossy buttons are a valid feature of the garb for humdrum and grassy hospitals, or more many intellect.<|im_end|>", -0.05923449248075485, -1.18646240234375, "And may properly lavish time and trouble thereupon. It is not arguable that glossy buttons are a valid feature of the garb of a humdrum and harassed hospital, orderly many a time."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And make properly lavish time out of working time. 
It is not improbable that glossy buttons are a valid feature in the garb of a humdrum and harassed hospital porter. Many intellect.<|im_end|>", 0.10980796068906784, 0.82170569896698, "And may properly lavish time and trouble thereupon. It is not arguable that glossy buttons are a valid feature of the garb of a humdrum and harassed hospital, orderly many a time."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And may properly lavish time after working upon it is not remarkable that glossy buttons are a valid feature of the garb for humdrum and grassy hospitals or more many intellect.<|im_end|>", 0.0013256088132038713, -0.46702858805656433, "And may properly lavish time and trouble thereupon. It is not arguable that glossy buttons are a valid feature of the garb of a humdrum and harassed hospital, orderly many a time."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And Shahrazad perceived the dawn of day and ceased saying her permitted say when it was the six hundred and seventy seventh night, she pursued it hath reached me o auspicious king that when the kafirs fell upon harib.<|im_end|>", 0.7613571882247925, 1.3583694696426392, "And shahrazad perceived the dawn of day and ceased saying her permitted say. When it was the six hundred and seventy seventh night, she pursued it. Hath reached me o auspicious king, that when the kafirs fell upon gharib."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And Shahrazad perceived the dawn of day and ceased saying her permitted say, when it was the six hundred and seventy seventh night. 
She pursued, it hath reached me, O auspicious king, that when the kaffirs fell upon Harib.<|im_end|>", 0.5681424736976624, -1.0484904050827026, "And shahrazad perceived the dawn of day and ceased saying her permitted say. When it was the six hundred and seventy seventh night, she pursued it. Hath reached me o auspicious king, that when the kafirs fell upon gharib."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And Shahrazad perceived the dawn of day and ceased saying her permitted say when it was the six hundred and seventy seventh night she pursued, it hath reached me o auspicious king that when the kafirs fell upon Harib.<|im_end|>", 0.6401126384735107, -0.1519639790058136, "And shahrazad perceived the dawn of day and ceased saying her permitted say. When it was the six hundred and seventy seventh night, she pursued it. Hath reached me o auspicious king, that when the kafirs fell upon gharib."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And Shahrazad perceived the dawn of day and ceased saying her permitted say, when it was the six hundred and seventy seventh night she pursued, it hath reached me o auspicious king that when the kafirs fell upon harib.<|im_end|>", 0.6396347880363464, -0.15791653096675873, "And shahrazad perceived the dawn of day and ceased saying her permitted say. When it was the six hundred and seventy seventh night, she pursued it. 
Hath reached me o auspicious king, that when the kafirs fell upon gharib."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>beasy would make reply but was from a certain person whom perhaps we need not name then the whiskey bottle would move forward like a pawn in chess and the next suaded words would be<|im_end|>", 0.8032140731811523, 0.47693824768066406, "deasey would make reply but twas from a certain person whom perhaps we need not name then the whiskey bottle would move forward like a pawn in chess and the next soothing words would be"], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>beasley would make reply, but was from a certain person whom perhaps we need not name then the whiskey bottle would move forward like a pawn in chess and the next soothing words would be<|im_end|>", 0.8078052401542664, 0.5542405247688293, "deasey would make reply but twas from a certain person whom perhaps we need not name then the whiskey bottle would move forward like a pawn in chess and the next soothing words would be"], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>these he would make reply, but was from a certain person whom perhaps we need not name then the whiskey bottle would move forward like a pawn in chess and the next suaded words would be<|im_end|>", 0.6860186457633972, -1.4963009357452393, "deasey would make reply but twas from a certain person whom perhaps we need not name then the whiskey bottle would move forward like a pawn in chess and the next soothing words would be"], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>hezekiah would make reply but was from a certain person whom perhaps we need not name then the whiskey bottle would move forward like a palm in 
chess and the next soothing words would be<|im_end|>", 0.8025121688842773, 0.4651201665401459, "deasey would make reply but twas from a certain person whom perhaps we need not name then the whiskey bottle would move forward like a pawn in chess and the next soothing words would be"], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He did in fact begin it when setting out on the aforementioned second trip to Europe, calling it.<|im_end|>", 0.7412750124931335, -0.7827419638633728, "He did, in fact, begin it when setting out on the aforementioned second trip to europe, calling it."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He did, in fact, begin it when setting out on the aforementioned second trip to Europe calling it.<|im_end|>", 0.8706542253494263, 0.26100391149520874, "He did, in fact, begin it when setting out on the aforementioned second trip to europe, calling it."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He did, in fact, begin it when setting out on the aforementioned second trip to Europe, calling it.<|im_end|>", 1.0, 1.3044800758361816, "He did, in fact, begin it when setting out on the aforementioned second trip to europe, calling it."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He did in fact begin it when setting out on the aforementioned second trip to Europe, calling it.<|im_end|>", 0.7412750124931335, -0.7827419638633728, "He did, in fact, begin it when setting out on the aforementioned second trip to europe, calling it."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Bayard knew that his master was upon him, and he started off upon a rapid pace. 
And in a few moments, he had galloped. Malagigi pretended to be in great alarm. O noble king and master, he cried, my poor companion has run away with. He will fall and break his neck.<|im_end|>", 0.45684748888015747, 1.159354329109192, "Bayard knew that his master was upon him, and he started off upon a rapid pace, and in a few moments was a good way off. Malagigi pretended to be in great alarm o, noble king and master. He cried, my poor companion is run away with he will fall and break his neck."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Fayard knew that his master was upon him, and he started off upon a rapid pace. And in a few moments, he had galloped on. Malagigi pretended to be in great alarm. O noble king and master, he cried, my poor companion has run away with. He will fall and break his neck.<|im_end|>", 0.3951204717159271, -0.9790310263633728, "Bayard knew that his master was upon him, and he started off upon a rapid pace, and in a few moments was a good way off. Malagigi pretended to be in great alarm o, noble king and master. He cried, my poor companion is run away with he will fall and break his neck."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Fayard knew that his master was upon him, and he started off upon a rapid pace. And in a few moments, he had galloped away. Malagigi pretended to be in great alarm. O noble king and master, he cried, my poor companion has run away with me. He will fall and break his neck.<|im_end|>", 0.4041914939880371, -0.6647871136665344, "Bayard knew that his master was upon him, and he started off upon a rapid pace, and in a few moments was a good way off. Malagigi pretended to be in great alarm o, noble king and master. 
He cried, my poor companion is run away with he will fall and break his neck."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Vaillard knew that his master was upon him, and he started off upon a rapid pace. And in a few moments of he did run off malagigi pretended to be in great alarm. O noble king and master, he cried, my poor companion has run away with. He will fall and break his neck.<|im_end|>", 0.43736597895622253, 0.4844638407230377, "Bayard knew that his master was upon him, and he started off upon a rapid pace, and in a few moments was a good way off. Malagigi pretended to be in great alarm o, noble king and master. He cried, my poor companion is run away with he will fall and break his neck."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>She laid a firm, delicate hand on her gold green jerkin. Ellidore. This was pleasant, but we got no nearer. We can't sit here and learn the language. Terry protested.<|im_end|>", 0.9188264608383179, 0.447922945022583, "She laid a firm, delicate hand on her gold green jerkin. Ellador, this was pleasant, but we got no nearer. We can't sit here and learn the language. Terry protested."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>She laid a firm, delicate hand on her gold green jerkin. Ellador, this was pleasant. But we got no nearer. We can't sit here and learn the language. Terry protested.<|im_end|>", 0.9217362999916077, 0.5236092805862427, "She laid a firm, delicate hand on her gold green jerkin. Ellador, this was pleasant, but we got no nearer. We can't sit here and learn the language. 
Terry protested."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>She laid a firm, delicate hand on her gold green jerkin ellador. This was pleasant, but we got no nearer. We can't sit here and learn the language. Terry protested.<|im_end|>", 0.8441234230995178, -1.4951399564743042, "She laid a firm, delicate hand on her gold green jerkin. Ellador, this was pleasant, but we got no nearer. We can't sit here and learn the language. Terry protested."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>She laid a firm, delicate hand on her gold green jerkin. Ellador, this was pleasant. But we got no nearer. We can't sit here and learn the language. Terry protested.<|im_end|>", 0.9217362999916077, 0.5236092805862427, "She laid a firm, delicate hand on her gold green jerkin. Ellador, this was pleasant, but we got no nearer. We can't sit here and learn the language. 
Terry protested."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>he cried out savage and fought and struggled two minutes however he did little against his four adversaries and worn out with his struggle flat suddenly from the dusty floor with emotion in spirit lost lost he muttered all lost<|im_end|>", 0.09937235713005066, 0.43719542026519775, "he cried out savagely and fought with the strength of two men however he could do little against his four adversaries and worn out with the struggle collapsed suddenly on to the dusty floor with a motion of despair lost lost he muttered all lost"], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>he cried out sadly and fought and strangled two men however he did little against four adversaries the worn out with his struggle flat suddenly upon the dusty floor with emotion in his spirit lost lost he muttered all lost<|im_end|>", 0.03799943998456001, -0.10167413204908371, "he cried out savagely and fought with the strength of two men however he could do little against his four adversaries and worn out with the struggle collapsed suddenly on to the dusty floor with a motion of despair lost lost he muttered all lost"], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>he cried out savage and fought and strangled two men however he did little against four adversaries and worn out with his struggle flat suddenly on the dusty floor with emotion in his spirit lost lost he muttered all lost<|im_end|>", 0.16370610892772675, 1.0020618438720703, "he cried out savagely and fought with the strength of two men however he could do little against his four adversaries and worn out with the struggle collapsed suddenly on to the dusty floor with a motion of despair lost lost he muttered all lost"], ["580", 
"<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>he cried out savagely and fought and struggled two minutes however with little against four adversaries and worn out of his breath, platt suddenly among the dusty floor with emotion in his spirit lost lost he muttered all lost<|im_end|>", -0.1027606725692749, -1.337583065032959, "he cried out savagely and fought with the strength of two men however he could do little against his four adversaries and worn out with the struggle collapsed suddenly on to the dusty floor with a motion of despair lost lost he muttered all lost"], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And thus he accomplished this by the bye during the siege of the city, for he had his enemies in great contempt already. Nine when he had thus married Mariamne.<|im_end|>", 0.6356512308120728, -0.49875012040138245, "And thus he accomplished this by the by, during the siege of the city. For he had his enemies in great contempt already nine when he had thus married mariamne, he."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And thus he accomplished this by the bye during the siege of the city, for he had his enemies in great contempt already. Nine when he had thus married Mariamne.<|im_end|>", 0.6356512308120728, -0.49875012040138245, "And thus he accomplished this by the by, during the siege of the city. 
For he had his enemies in great contempt already nine when he had thus married mariamne, he."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And thus he accomplished this by the bye during the siege of the city, for he had his enemies in great contempt already nine when he had thus married mariamne.<|im_end|>", 0.715508222579956, 1.4962533712387085, "And thus he accomplished this by the by, during the siege of the city. For he had his enemies in great contempt already nine when he had thus married mariamne, he."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And thus he accomplished this by the bye during the siege of the city, for he had his enemies in great contempt already. Nine when he had thus married Mariamne.<|im_end|>", 0.6356512308120728, -0.49875012040138245, "And thus he accomplished this by the by, during the siege of the city. For he had his enemies in great contempt already nine when he had thus married mariamne, he."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Putting both hands on her shoulders and looking into the brown eyes, should you be willing to go abroad with your mother and phronsie, mister king and jasper? Oh Polly gasped, but you.<|im_end|>", 0.9294845461845398, 0.7829669117927551, "Putting both hands on her shoulders and looking into the brown eyes, should you be willing to go abroad with your mother and phronsie, mister king and jasper? Oh, polly gasped, but you."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Putting both hands on her shoulders and looking into the brown eyes, should you be willing to go abroad with your mother and phronsie mister king and jasper? Oh Polly gasped. 
But you.<|im_end|>", 0.7878445386886597, -1.3021132946014404, "Putting both hands on her shoulders and looking into the brown eyes, should you be willing to go abroad with your mother and phronsie, mister king and jasper? Oh, polly gasped, but you."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Putting both hands on her shoulders and looking into the brown eyes, should you be willing to go abroad with your mother and phronsie, mister king and jasper? Oh Polly gasped, but you.<|im_end|>", 0.9294845461845398, 0.7829669117927551, "Putting both hands on her shoulders and looking into the brown eyes, should you be willing to go abroad with your mother and phronsie, mister king and jasper? Oh, polly gasped, but you."], ["580", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Putting both hands on her shoulders and looking into the brown eyes, should you be willing to go abroad with your mother and phronsie, mister king and jasper? Oh Polly gasped. But you.<|im_end|>", 0.858376145362854, -0.2638187110424042, "Putting both hands on her shoulders and looking into the brown eyes, should you be willing to go abroad with your mother and phronsie, mister king and jasper? Oh, polly gasped, but you."]]}
wandb/run-20260418_172847-c2a5hfz3/files/media/table/completions_297_2c3b42b29065c75ff192.table.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"columns": ["step", "prompt", "completion", "ASRWerSubLenCmpHalluDirtyV56", "advantages", "solution"], "data": [["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The underling had insufficient, gave orders to the coachman and being readiness on the stairs took him up to his post. The steed balked and was about to kick the whip, ah, does he indicate?<|im_end|>", -0.5885342359542847, 0.47900471091270447, "You have the window. That is sufficient give orders to the coachman and be in readiness on the stairs to conduct us to it. The steward bowed and was about to quit the room. Ah continued the count."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The underling added sufficient, gave orders to the coachman and being readiness on the stairs took him up the steps. The steed balked and was about to caper, ah, it is a wonder good.<|im_end|>", -0.7021157145500183, 0.06742512434720993, "You have the window. That is sufficient give orders to the coachman and be in readiness on the stairs to conduct us to it. The steward bowed and was about to quit the room. Ah continued the count."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The underling was satisfied, gave orders to the coachman and being readiness on the stairs took him up the steps. The steed balked and was about to caper. Bah! Does he indeed?<|im_end|>", -0.7042824625968933, 0.05957358703017235, "You have the window. That is sufficient give orders to the coachman and be in readiness on the stairs to conduct us to it. The steward bowed and was about to quit the room. 
Ah continued the count."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The underling had insufficient the orders for capture and being readiness on the stairs took a left of straight the steed balked and was about to capitulate, ah, it is my defeat.<|im_end|>", -0.968815267086029, -0.899000883102417, "You have the window. That is sufficient give orders to the coachman and be in readiness on the stairs to conduct us to it. The steward bowed and was about to quit the room. Ah continued the count."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The underling had insufficient. He ordered for patron and being readiness on the stairs to connect his trunk, he steered back, and was about to return, but, as I indicated.<|im_end|>", -1.0357601642608643, -1.1415858268737793, "You have the window. That is sufficient give orders to the coachman and be in readiness on the stairs to conduct us to it. The steward bowed and was about to quit the room. Ah continued the count."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The underling was very sufficient. He ordered his detachment, and being readiness on the stairs took a left of straits. The steed balked and was about to fall off. Bah! There is no end to it.<|im_end|>", -1.0646944046020508, -1.2464333772659302, "You have the window. That is sufficient give orders to the coachman and be in readiness on the stairs to conduct us to it. The steward bowed and was about to quit the room. Ah continued the count."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The underling, and is sufficient. Give orders to the coachman in being readiness on the stairs to conduct us straight. The steer barked and was about to get up. 
Ah, there's a winded goat.<|im_end|>", -0.35244596004486084, 1.3345061540603638, "You have the window. That is sufficient give orders to the coachman and be in readiness on the stairs to conduct us to it. The steward bowed and was about to quit the room. Ah continued the count."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The underling was not sufficient. He ordered the patrol, and being readiness on the stairs, took him up the steps. The steamer backed, and he had about to put in, bah! There is no engine.<|im_end|>", -1.093247413635254, -1.3498995304107666, "You have the window. That is sufficient give orders to the coachman and be in readiness on the stairs to conduct us to it. The steward bowed and was about to quit the room. Ah continued the count."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The underling added sufficient, gave orders to the coachman and being readiness on the stairs took a left of stroke. The steer barked and was about to click away. Ah, there's my underling.<|im_end|>", -0.7040185928344727, 0.06052975729107857, "You have the window. That is sufficient give orders to the coachman and be in readiness on the stairs to conduct us to it. The steward bowed and was about to quit the room. Ah continued the count."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The underling, that is sufficient, give orders to the coachman and be in readiness on the stairs to conduct us straight. The steed balks when he is about to pick up baas, his wounded feet.<|im_end|>", -0.28640249371528625, 1.5738246440887451, "You have the window. That is sufficient give orders to the coachman and be in readiness on the stairs to conduct us to it. The steward bowed and was about to quit the room. 
Ah continued the count."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The underling had insufficient, gave orders to the coachman and being readiness on the stairs took him up the steps. The steed balked and was about to kick her, but his rider kicked.<|im_end|>", -0.7038772106170654, 0.06104207783937454, "You have the window. That is sufficient give orders to the coachman and be in readiness on the stairs to conduct us to it. The steward bowed and was about to quit the room. Ah continued the count."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>The underling was satisfied, gave orders for the coachman and being readiness on the stairs to conduct us to it. The steed balked and laid about the cookelard, but his lamentations.<|im_end|>", -0.44447875022888184, 1.0010114908218384, "You have the window. That is sufficient give orders to the coachman and be in readiness on the stairs to conduct us to it. The steward bowed and was about to quit the room. Ah continued the count."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>About three claims to hand tom was familiar with most of these claims, but occasionally would see a new one that excited his curiosity. However, he was more interested in what Andy Foger had to manage andy's machine had not been tried. Tom Warner only dared risk five minutes.<|im_end|>", 0.0947486162185669, 0.5240245461463928, "With three planes behind. Tom was familiar with most of these types, but occasionally he saw a new one that excited his curiosity. However, he was more interested in what andy foger would turn out. 
Andy's machine had not been tried, and tom wondered how he dared risk flying in it."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>But three claims to hands, tom was familiar with most of these claims, but occasionally would see a new one that excited his curiosity. However, he was more interested in what Andy Foger had to invent. Andy's machine had not been tried. Tom Warner only dared risk five minutes.<|im_end|>", 0.09490512311458588, 0.5261728763580322, "With three planes behind. Tom was familiar with most of these types, but occasionally he saw a new one that excited his curiosity. However, he was more interested in what andy foger would turn out. Andy's machine had not been tried, and tom wondered how he dared risk flying in it."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At three claims to hand, Tom was familiar with most of these claims, but occasionally would see a new one that excited his curiosity. However, he was more interested in what Andy Foger had to invent. Andy's machine had not been tried. Tom Warner only dared it once for five minutes.<|im_end|>", -0.04116278141736984, -1.3415790796279907, "With three planes behind. Tom was familiar with most of these types, but occasionally he saw a new one that excited his curiosity. However, he was more interested in what andy foger would turn out. Andy's machine had not been tried, and tom wondered how he dared risk flying in it."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>About three claims to hand, tom was familiar with most of these claims, but occasionally would see a new one that excited his curiosity. However, he was more interested in what Andy Foger had to manage. Andy's machine had not been tried. 
Tom Warner only dared risk flying minutes.<|im_end|>", 0.15220792591571808, 1.3127464056015015, "With three planes behind. Tom was familiar with most of these types, but occasionally he saw a new one that excited his curiosity. However, he was more interested in what andy foger would turn out. Andy's machine had not been tried, and tom wondered how he dared risk flying in it."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>About three claims to hand, tom was familiar with most of these claims, but occasionally would see a new one that excited his curiosity. However, he was more interested in what Andy Foger had to manage. Andy's machinery had not been tried. Tom wondered why the era was applying minutes.<|im_end|>", -0.027287397533655167, -1.1511170864105225, "With three planes behind. Tom was familiar with most of these types, but occasionally he saw a new one that excited his curiosity. However, he was more interested in what andy foger would turn out. Andy's machine had not been tried, and tom wondered how he dared risk flying in it."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>But three claims to hand tom was familiar with most of these claims, but occasionally would see a new one that excited his curiosity. However, he was more interested in what Andy Foger had to invent. Andy's machine had not been tried. Tom Warner only dared risk flying minutes.<|im_end|>", 0.153399258852005, 1.329099416732788, "With three planes behind. Tom was familiar with most of these types, but occasionally he saw a new one that excited his curiosity. However, he was more interested in what andy foger would turn out. 
Andy's machine had not been tried, and tom wondered how he dared risk flying in it."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>But three claims to hand tom was familiar with most of these claims, but occasionally would see a new one that excited his curiosity. However, he was more interested in what Andy Foger had to manage. Andy's machine had not been tried. Tom Warner only dared risk flying minutes.<|im_end|>", 0.1526142656803131, 1.318324089050293, "With three planes behind. Tom was familiar with most of these types, but occasionally he saw a new one that excited his curiosity. However, he was more interested in what andy foger would turn out. Andy's machine had not been tried, and tom wondered how he dared risk flying in it."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>But three claims to hand tom was familiar with most of these claims, but occasionally would see a new one that excited his curiosity. However, he was more interested in what Andy Foger had to invent. Andy's machine had not been tried. Tom Warner would only dare to risk five minutes.<|im_end|>", -0.037495389580726624, -1.2912381887435913, "With three planes behind. Tom was familiar with most of these types, but occasionally he saw a new one that excited his curiosity. However, he was more interested in what andy foger would turn out. Andy's machine had not been tried, and tom wondered how he dared risk flying in it."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>About three claims to hand tom was familiar with most of these claims, but occasionally would see a new one that excited his curiosity. However, he was more interested in what Andy Foger had to manage andy's machine had not been tried. 
Tom marvelled at the daring riskful flying minutes.<|im_end|>", 0.026256464421749115, -0.41614094376564026, "With three planes behind. Tom was familiar with most of these types, but occasionally he saw a new one that excited his curiosity. However, he was more interested in what andy foger would turn out. Andy's machine had not been tried, and tom wondered how he dared risk flying in it."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At three times the hands tom was familiar with most of these points, but occasionally would see a new one that excited his curiosity. However, he was more interested in what Andy Foger had to invent. Andy's machine had not been tried. Tom Warner would only dare risk five minutes.<|im_end|>", 0.03246723860502243, -0.330888032913208, "With three planes behind. Tom was familiar with most of these types, but occasionally he saw a new one that excited his curiosity. However, he was more interested in what andy foger would turn out. Andy's machine had not been tried, and tom wondered how he dared risk flying in it."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At three times to hand tom was familiar with most of these points, but occasionally would see a new one that excited his curiosity. However, he was more interested in what Andy Foger was doing. Andy's machine had not been tried. Tom Warner only dared to whistle five minutes.<|im_end|>", 0.04056717827916145, -0.21970325708389282, "With three planes behind. Tom was familiar with most of these types, but occasionally he saw a new one that excited his curiosity. However, he was more interested in what andy foger would turn out. 
Andy's machine had not been tried, and tom wondered how he dared risk flying in it."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>About three claims to hand tom was familiar with most of these claims, but occasionally would see a new one that excited his curiosity. However, he was more interested in what Andy Foger had to manage andy's machinery had not been tried. Tom Warner only dared risk five minutes.<|im_end|>", 0.03765326738357544, -0.2597014009952545, "With three planes behind. Tom was familiar with most of these types, but occasionally he saw a new one that excited his curiosity. However, he was more interested in what andy foger would turn out. Andy's machine had not been tried, and tom wondered how he dared risk flying in it."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Even had they wished to do it, which remains doubtful. She came behind the wicked grovendam and twisted her neck just as a quick bell of iron dared aspire.<|im_end|>", 0.1723645180463791, -0.36288517713546753, "Even had they wished to do it, which remains doubtful, she came behind the wicked grognon and twisted her neck, just as a cook does a barn door fowl."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Even had they wished to do it, which remains doubtful. 
She came behind the wicked greggong and twisted her neck just as a quick bell of iron gave a sigh.<|im_end|>", 0.09226466715335846, -1.601252555847168, "Even had they wished to do it, which remains doubtful, she came behind the wicked grognon and twisted her neck, just as a cook does a barn door fowl."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Even had they wished to do it, which remains doubtful, she came behind the wicked grovden and twisted her neck just as a quick bell of burning barrel fire.<|im_end|>", 0.27071085572242737, 1.1575783491134644, "Even had they wished to do it, which remains doubtful, she came behind the wicked grognon and twisted her neck, just as a cook does a barn door fowl."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Even had they wished to do it, which remains doubtful, she came behind the wicked grovding and twisted her neck just as a quick bell of iron dare fire.<|im_end|>", 0.27202051877975464, 1.177826166152954, "Even had they wished to do it, which remains doubtful, she came behind the wicked grognon and twisted her neck, just as a cook does a barn door fowl."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Even had they wished to do it, which remains doubtful she came behind the wicked greggion and twisted her neck just as a quick bell of iron dared fire.<|im_end|>", 0.1751171350479126, -0.32032889127731323, "Even had they wished to do it, which remains doubtful, she came behind the wicked grognon and twisted her neck, just as a cook does a barn door fowl."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Even had they wished to do it, which remains doubtful, she came behind the wicked greggion and twisted her neck just 
as a quick bell of burning death died.<|im_end|>", 0.26866206526756287, 1.1259034872055054, "Even had they wished to do it, which remains doubtful, she came behind the wicked grognon and twisted her neck, just as a cook does a barn door fowl."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Even had they wished to do it, which remains doubtful, she came behind the wicked gregg dawn and twisted her neck just as a quick bell of iron dare fire.<|im_end|>", 0.19315652549266815, -0.04143457114696503, "Even had they wished to do it, which remains doubtful, she came behind the wicked grognon and twisted her neck, just as a cook does a barn door fowl."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Even had they wished to do it, which remains doubtful. She came behind the wicked grovendal and twisted her neck just as a quick bell of iron dared fire.<|im_end|>", 0.17351007461547852, -0.34517452120780945, "Even had they wished to do it, which remains doubtful, she came behind the wicked grognon and twisted her neck, just as a cook does a barn door fowl."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Even had they wished to do it, which remains doubtful. She came behind the wicked gregg dawn and twisted her neck just as a quick bell of barren derrick sound.<|im_end|>", 0.09223079681396484, -1.6017762422561646, "Even had they wished to do it, which remains doubtful, she came behind the wicked grognon and twisted her neck, just as a cook does a barn door fowl."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Even had they wished to do it, which remains doubtful. 
She came behind the wicked greggong and twisted her neck just as a quick bell of ironbare fire.<|im_end|>", 0.19122624397277832, -0.07127729803323746, "Even had they wished to do it, which remains doubtful, she came behind the wicked grognon and twisted her neck, just as a cook does a barn door fowl."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Even had they wished to do it, which remains doubtful, she came behind the wicked grogman and twisted her neck just as a quick bell of burning barrel fire.<|im_end|>", 0.2721707224845886, 1.1801483631134033, "Even had they wished to do it, which remains doubtful, she came behind the wicked grognon and twisted her neck, just as a cook does a barn door fowl."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Even had they wished to do it, which remains doubtful. She came behind the wicked grogman and twisted her neck just as a quick bell of iron dared sound.<|im_end|>", 0.17660479247570038, -0.29732927680015564, "Even had they wished to do it, which remains doubtful, she came behind the wicked grognon and twisted her neck, just as a cook does a barn door fowl."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Though just yet none ventured to follow us, it was as though they felt that to do so would be crossing their own line. I wonder whether they might have considered this with any intrepidation or perhaps sullen satisfaction if they had had any chance to reward anybody for following me.<|im_end|>", -0.30214083194732666, -0.016384782269597054, "Though just yet none ventured to follow us. It was as though they felt that to do so was like crossing a dead line. 
I wondered which one of them might be looking at us with inward trepidation, or perhaps satisfaction, if there had been any chance to remove anything incriminating."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Though just yet none ventured to follow us, it was as though they felt that to do so would be crossing their beloved. I wondered whether they might have considered this with any trepidation or perhaps self hatred if they had had any chance to avoid any further trouble.<|im_end|>", -0.24527063965797424, 0.48843005299568176, "Though just yet none ventured to follow us. It was as though they felt that to do so was like crossing a dead line. I wondered which one of them might be looking at us with inward trepidation, or perhaps satisfaction, if there had been any chance to remove anything incriminating."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Though just yet none ventured to follow us, it was as though they felt that to do so would be crossing their beloved I wondered whether they might have acknowledged with any approbation or perhaps satisfaction if they had had any chance to reward anybody for coming.<|im_end|>", -0.18428294360637665, 1.0297943353652954, "Though just yet none ventured to follow us. It was as though they felt that to do so was like crossing a dead line. I wondered which one of them might be looking at us with inward trepidation, or perhaps satisfaction, if there had been any chance to remove anything incriminating."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Though just yet none ventured to follow us, it was as though they felt the security of that crossing had been lost. 
I wondered whether they might have evaded us with any more deliberation or perhaps fast fetched if they had had any chance to avoid anything approaching me.<|im_end|>", -0.40226879715919495, -0.9051822423934937, "Though just yet none ventured to follow us. It was as though they felt that to do so was like crossing a dead line. I wondered which one of them might be looking at us with inward trepidation, or perhaps satisfaction, if there had been any chance to remove anything incriminating."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Though just yet, none ventured to follow us. It was as though they felt it to be folly without crossing the blue line. I wondered whether they might have evaded us with any more preparation, or perhaps fell afresh if they had got any chance to avoid anything before them.<|im_end|>", -0.29436060786247253, 0.052677273750305176, "Though just yet none ventured to follow us. It was as though they felt that to do so was like crossing a dead line. I wondered which one of them might be looking at us with inward trepidation, or perhaps satisfaction, if there had been any chance to remove anything incriminating."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Though just yet, none ventured to follow us. It was as though they felt it to be folly that crossing the blue line. I wondered if even then my little visitors would any more trepidation or perhaps self hatred, if they had but any chance to avoid anything like fear.<|im_end|>", -0.45500248670578003, -1.3732788562774658, "Though just yet none ventured to follow us. It was as though they felt that to do so was like crossing a dead line. 
I wondered which one of them might be looking at us with inward trepidation, or perhaps satisfaction, if there had been any chance to remove anything incriminating."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Though just yet none ventured to follow us, it was as though they felt that to do so would be crossing their beloved. I wondered whether they might have encountered us with any more trepidation or perhaps sarsfetched if they had had any chance to avoid anybody in the crowd.<|im_end|>", -0.23299074172973633, 0.5974339842796326, "Though just yet none ventured to follow us. It was as though they felt that to do so was like crossing a dead line. I wondered which one of them might be looking at us with inward trepidation, or perhaps satisfaction, if there had been any chance to remove anything incriminating."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Though just yet, none ventured to follow us. It was as though they felt that to do so would be crossing their beloved. I wondered whether they might have lived with us in more consideration or perhaps satisfied if they had had any chance to reward anybody for coming.<|im_end|>", -0.2098255306482315, 0.8030626773834229, "Though just yet none ventured to follow us. It was as though they felt that to do so was like crossing a dead line. I wondered which one of them might be looking at us with inward trepidation, or perhaps satisfaction, if there had been any chance to remove anything incriminating."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Though just yet, none ventured to follow us. It was as though they felt it to be far as if crossing forbidden lines. 
I wondered whether they might have evaded us with equal precipitation, or perhaps fast fetched, if they had but any chance to avoid anything from following.<|im_end|>", -0.3078778386116028, -0.06730998307466507, "Though just yet none ventured to follow us. It was as though they felt that to do so was like crossing a dead line. I wondered which one of them might be looking at us with inward trepidation, or perhaps satisfaction, if there had been any chance to remove anything incriminating."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Though just yet, none ventured to follow us. It was as though they felt it would be folly without crossing the blue line. I wondered whether they might have regarded us with any trepidation, or perhaps, self-reproach, if they had had any chance to observe anything of our manner.<|im_end|>", -0.30904507637023926, -0.0776711031794548, "Though just yet none ventured to follow us. It was as though they felt that to do so was like crossing a dead line. I wondered which one of them might be looking at us with inward trepidation, or perhaps satisfaction, if there had been any chance to remove anything incriminating."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Though just yet, none ventured to follow us. It was as though they felt it to be folly to cross over the divide. I wonder whether they might have lived with us any more. Preparation or perhaps self, fetched if they had had any chance to avoid anything from harm.<|im_end|>", -0.5224043726921082, -1.9715795516967773, "Though just yet none ventured to follow us. It was as though they felt that to do so was like crossing a dead line. 
I wondered which one of them might be looking at us with inward trepidation, or perhaps satisfaction, if there had been any chance to remove anything incriminating."], ["595", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Though just yet none ventured to follow us, it was as though they felt that to do so would be crossing their own line. I wondered whether they might have taken us with any more trepidation or perhaps sarsfetched if they had had any chance to avoid anybody pursuing them.<|im_end|>", -0.13807019591331482, 1.440007209777832, "Though just yet none ventured to follow us. It was as though they felt that to do so was like crossing a dead line. I wondered which one of them might be looking at us with inward trepidation, or perhaps satisfaction, if there had been any chance to remove anything incriminating."]]}
wandb/run-20260418_172847-c2a5hfz3/files/media/table/completions_325_dedd0bb2cd2d27e14a92.table.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"columns": ["step", "prompt", "completion", "ASRWerSubLenCmpHalluDirtyV56", "advantages", "solution"], "data": [["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>But that, that's the same old lying doll thing. London is like a port of the sea place of temptation, there's pitfalls for men and traps for money in every turn, as I've heard say.<|im_end|>", -0.4760620892047882, 0.19658391177654266, "But if that's the frame o mind thou'rt in lunnon is like for to be a sore place o temptation. There's pitfalls for men and traps for money at ivery turn. As I've heerd say."], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>But that's the same old lying down I do running is like a port of the sole place of temptation there's pitfalls for men and traps for money in every turn, as I've got said.<|im_end|>", -0.6135305762290955, -0.7280290126800537, "But if that's the frame o mind thou'rt in lunnon is like for to be a sore place o temptation. There's pitfalls for men and traps for money at ivery turn. As I've heerd say."], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>But that that's the same, a lying gal. I think running is likely more to be a safe place of temptation there's pitfalls for men and traps for money in every turn as i've heard say.<|im_end|>", -0.35690099000930786, 0.9980613589286804, "But if that's the frame o mind thou'rt in lunnon is like for to be a sore place o temptation. There's pitfalls for men and traps for money at ivery turn. 
As I've heerd say."], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>But that's the same old lying gallant thing running his life for to be a safe place of temptation, there's pitfalls for men and traps for money in every turn as I've got said.<|im_end|>", -0.3606083393096924, 0.973125696182251, "But if that's the frame o mind thou'rt in lunnon is like for to be a sore place o temptation. There's pitfalls for men and traps for money at ivery turn. As I've heerd say."], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>But if that's the same a lion, thou art in running is like as well to the escape place of temptation, there's pitfalls for men and traps for money in every turn, as I thought fit.<|im_end|>", -0.5472695827484131, -0.2823576331138611, "But if that's the frame o mind thou'rt in lunnon is like for to be a sore place o temptation. There's pitfalls for men and traps for money at ivery turn. As I've heerd say."], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>But that, that's the same old lying doll thing running his life for to be a safe place of temptation. There's pitfalls for men and traps for money in every turn as I've heard said.<|im_end|>", -0.28626200556755066, 1.4731791019439697, "But if that's the frame o mind thou'rt in lunnon is like for to be a sore place o temptation. There's pitfalls for men and traps for money at ivery turn. As I've heerd say."], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>But that's the same old lying gal again. 
London is like a port of the sea, place of temptation, there's pitfalls for money and traps for money in every turn as I've said before.<|im_end|>", -0.6403212547302246, -0.9082230925559998, "But if that's the frame o mind thou'rt in lunnon is like for to be a sore place o temptation. There's pitfalls for men and traps for money at ivery turn. As I've heerd say."], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>But that, that's the same old lion. Thou art in London is like a port to the sea place of temptation. There's pitfalls for men and traps for money in every turn, as I thought fit.<|im_end|>", -0.5447036623954773, -0.26509925723075867, "But if that's the frame o mind thou'rt in lunnon is like for to be a sore place o temptation. There's pitfalls for men and traps for money at ivery turn. As I've heerd say."], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>But if that's the same, a lion bawling running is likely more to be a safe place of temptation there's pitfalls for men and traps for money in every turn as I have said before.<|im_end|>", -0.42995119094848633, 0.5067257881164551, "But if that's the frame o mind thou'rt in lunnon is like for to be a sore place o temptation. There's pitfalls for men and traps for money at ivery turn. As I've heerd say."], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>But if that's the same old lion, thou art in running is like a sport of the ill place of temptation. There's pitfalls for men and traps for money in every turn as I thought said.<|im_end|>", -0.45117539167404175, 0.3639717996120453, "But if that's the frame o mind thou'rt in lunnon is like for to be a sore place o temptation. There's pitfalls for men and traps for money at ivery turn. 
As I've heerd say."], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>But that, that's the same old lying gal up in London is like a port of the sea place of temptation. There's pitfalls for money and traps for money in every turn as I've got to say.<|im_end|>", -0.5213723182678223, -0.10817265510559082, "But if that's the frame o mind thou'rt in lunnon is like for to be a sore place o temptation. There's pitfalls for men and traps for money at ivery turn. As I've heerd say."], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>But that, that's the same old lion gallant thing runnin his life all through this old place of temptation, there's pitfalls for men and traps for men in every turn as I've got said.<|im_end|>", -0.8353171944618225, -2.2197656631469727, "But if that's the frame o mind thou'rt in lunnon is like for to be a sore place o temptation. There's pitfalls for men and traps for money at ivery turn. 
As I've heerd say."], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>i saw but few inhabitants during my excursion and i met a crowd of them actually drying and salting and loading codfish, the principal article of exportation<|im_end|>", 0.450447678565979, 1.2203410863876343, "i saw but few inhabitants during my excursion but i met a crowd on the beach drying salting and loading codfish the principal article of exportation"], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>i saw but few inhabitants during my excursion and i met a crowd of them actually drying and salting and roasting codfish, the principal article of exportation<|im_end|>", 0.34390777349472046, 0.75895094871521, "i saw but few inhabitants during my excursion but i met a crowd on the beach drying salting and loading codfish the principal article of exportation"], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>i saw but few inhabitants during my excursion and i met a crowd of them actually drying and salting and roasting codfish, the principal article of exportation<|im_end|>", 0.34390777349472046, 0.75895094871521, "i saw but few inhabitants during my excursion but i met a crowd on the beach drying salting and loading codfish the principal article of exportation"], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>i saw but few inhabitants during my excursion and i met a crowd of them actually drying and salting and roasting codfish the principal article of exportation<|im_end|>", 0.4490084648132324, 1.2141083478927612, "i saw but few inhabitants during my excursion but i met a crowd on the beach drying salting and loading codfish the principal article of exportation"], ["650", 
"<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>i saw but few inhabitants during my excursion, and i met a crowd of them actually dried and salted in loaded codfish, the principal article of exportation<|im_end|>", -0.09839683026075363, -1.1565287113189697, "i saw but few inhabitants during my excursion but i met a crowd on the beach drying salting and loading codfish the principal article of exportation"], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>i saw but few inhabitants during my excursion and i met a crowd of them actually dried and salted and loaded with codfish, the principal article of exportation<|im_end|>", 0.03567298501729965, -0.5759153366088867, "i saw but few inhabitants during my excursion but i met a crowd on the beach drying salting and loading codfish the principal article of exportation"], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>i saw but few inhabitants during my excursion and i met a crowd of them actually drying and salting and loading codfish, the principal article of exportation<|im_end|>", 0.450447678565979, 1.2203410863876343, "i saw but few inhabitants during my excursion but i met a crowd on the beach drying salting and loading codfish the principal article of exportation"], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>i saw but few inhabitants during my excursion and i met a crowd of them actually dried and salted and loaded in pot dishes the principal article of exportation<|im_end|>", -0.0665484219789505, -1.0186035633087158, "i saw but few inhabitants during my excursion but i met a crowd on the beach drying salting and loading codfish the principal article of exportation"], ["650", 
"<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>i saw but few inhabitants during my excursion and i met a crowd of them actually dried and salted and loaded with codfish, the principal article of exportation<|im_end|>", 0.03567298501729965, -0.5759153366088867, "i saw but few inhabitants during my excursion but i met a crowd on the beach drying salting and loading codfish the principal article of exportation"], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>i saw but few inhabitants during my excursion and i met a crowd of the actually dried and salted and loaded codfish, the principal article of exportation<|im_end|>", 0.23414531350135803, 0.28360486030578613, "i saw but few inhabitants during my excursion but i met a crowd on the beach drying salting and loading codfish the principal article of exportation"], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>i saw but few inhabitants during my excursion and i met a crowd of them actually dried and salted in woven pot dishes the principal article of exportation<|im_end|>", -0.07731880247592926, -1.06524658203125, "i saw but few inhabitants during my excursion but i met a crowd on the beach drying salting and loading codfish the principal article of exportation"], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>i saw but few inhabitants during my excursion and i met a crowd of them actually dried and salted in wooden pot dishes, the principal article of exportation<|im_end|>", -0.07705149054527283, -1.0640889406204224, "i saw but few inhabitants during my excursion but i met a crowd on the beach drying salting and loading codfish the principal article of exportation"], ["650", 
"<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>to allow her to derive encouragement from a preference only given her because her real situation was so different but that it was so probably declared by lucie's eyes on the trump that it was declared over in the next moment more evidently<|im_end|>", 0.18845127522945404, 0.42637088894844055, "or to allow her to derive encouragement from a preference only given her because her real situation was unknown but that it was so had not only been declared by lucy's eyes at the time but was declared over again the next morning more openly"], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>to allow marge and her rival encouragement with a preference only in it because her real situation was a thinner one, but that it was so probably been declared by lucy's eyes on the trumpet that it was declared over again next morning more evidently<|im_end|>", -0.10559716075658798, -1.9492686986923218, "or to allow her to derive encouragement from a preference only given her because her real situation was unknown but that it was so had not only been declared by lucy's eyes at the time but was declared over again the next morning more openly"], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>to allow her to derive encouragement from a preference only in her because her real situation was so different but that it was so probably been declared by lucy's eyes on the trump, that it was declared over again next morning more evidently<|im_end|>", 0.3131347894668579, 1.4336984157562256, "or to allow her to derive encouragement from a preference only given her because her real situation was unknown but that it was so had not only been declared by lucy's eyes at the time but was declared over again the next morning more openly"], 
["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>to allow her to derive encouragement from a preference, only in her because her real situation was so different, but that it was so probably been declared by lucy's eyes on the triumph, that it was declared over again next morning more evidently<|im_end|>", 0.2516788840293884, 0.9371914863586426, "or to allow her to derive encouragement from a preference only given her because her real situation was unknown but that it was so had not only been declared by lucy's eyes at the time but was declared over again the next morning more openly"], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>to allow her to derive encouragement from a preference only in her because her own situation was so different but that it was so probably been declared by lucas eyes on the trumpet that it was declared over and over again more evidently<|im_end|>", 0.00036666117375716567, -1.0931788682937622, "or to allow her to derive encouragement from a preference only given her because her real situation was unknown but that it was so had not only been declared by lucy's eyes at the time but was declared over again the next morning more openly"], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>to allow her to derive encouragement from a preference only given her because her good situation was limited, but that it was so probably been declared by lucas eyes on the trump, that it was declared over in the next moment more evidently<|im_end|>", 0.2317005693912506, 0.7757852077484131, "or to allow her to derive encouragement from a preference only given her because her real situation was unknown but that it was so had not only been declared by lucy's eyes at the time but was declared over again the next morning more openly"], 
["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>to allow her to derive encouragement from a preference only in her because her real situation was so different but that it was so probably been declared by lucy's eyes on the triumph then was declared over and an excellent evening more evident<|im_end|>", 0.17100711166858673, 0.2854381799697876, "or to allow her to derive encouragement from a preference only given her because her real situation was unknown but that it was so had not only been declared by lucy's eyes at the time but was declared over again the next morning more openly"], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>to allow her to derive encouragement from a preference only given her because her own situation was so thin but that it was so probably declared by lucy's eyes on trump that it was declared over in an excellent and warm oven.<|im_end|>", -0.01022692583501339, -1.1787652969360352, "or to allow her to derive encouragement from a preference only given her because her real situation was unknown but that it was so had not only been declared by lucy's eyes at the time but was declared over again the next morning more openly"], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>to allow her to derive encouragement from a preference only in her because her good situation was slender but that it was so probably been declared by lucas eyes on the trump then was declared over and annexed to even more evidently<|im_end|>", 0.09647921472787857, -0.31667831540107727, "or to allow her to derive encouragement from a preference only given her because her real situation was unknown but that it was so had not only been declared by lucy's eyes at the time but was declared over again the next morning more openly"], ["650", 
"<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>to allow her to derive encouragement from a preference, only in her because her own situation was so limited, but that it was so probably been declared by lucy's eyes on the trump, and was declared over again next morning more evidently<|im_end|>", 0.23830121755599976, 0.8291123509407043, "or to allow her to derive encouragement from a preference only given her because her real situation was unknown but that it was so had not only been declared by lucy's eyes at the time but was declared over again the next morning more openly"], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>to allow her to derive encouragement from a preference only in her because her real situation was so thin but that it was so probably been declared by lucy's eyes on the truant that it was declared over evident and explained more evidently<|im_end|>", 0.12768252193927765, -0.06458445638418198, "or to allow her to derive encouragement from a preference only given her because her real situation was unknown but that it was so had not only been declared by lucy's eyes at the time but was declared over again the next morning more openly"], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>to allow her to derive encouragement from a preference only in her because her real situation was so different but that it was so probably been declared by lucy's eyes on the trumpet, that it was declared over and an excellently more evidently<|im_end|>", 0.12514056265354156, -0.08512113988399506, "or to allow her to derive encouragement from a preference only given her because her real situation was unknown but that it was so had not only been declared by lucy's eyes at the time but was declared over again the next morning more openly"], ["650", 
"<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>In a very short time, you would have laughed to a song if I saw yesterday Emmett did not know whether she was on her head or heels in such a hurry to tell him great news.<|im_end|>", 0.44709184765815735, -1.250040054321289, "In a very short time. You would have laughed to have seen what I saw yesterday. Emma did not know whether she was on her head or heels. In such a hurry to tell your great news."], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>In a very short time, you would have laughed to your sin if I saw yesterday Emmet did not know whether she was on her head or hands in such a hurry to tell you great news.<|im_end|>", 0.4470624029636383, -1.2503377199172974, "In a very short time. You would have laughed to have seen what I saw yesterday. Emma did not know whether she was on her head or heels. In such a hurry to tell your great news."], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>In a very short time you would have laughed to your sin if I saw yesterday Emmet did not know whether she was on her head or heels in such a hurry to tell you great news.<|im_end|>", 0.4515860378742218, -1.2046061754226685, "In a very short time. You would have laughed to have seen what I saw yesterday. Emma did not know whether she was on her head or heels. In such a hurry to tell your great news."], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>In a very short time, you would have laughed to see what I saw yesterday. Emmett did not know whether she was on her head or heels in such a hurry to tell your great news.<|im_end|>", 0.6924002766609192, 1.229895830154419, "In a very short time. 
You would have laughed to have seen what I saw yesterday. Emma did not know whether she was on her head or heels. In such a hurry to tell your great news."], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>In a very short time, you would have laughed to your sin that I saw yesterday. Emmet did not know whether she was on her head or thumbs in such a hurry to tell you great news.<|im_end|>", 0.5242686867713928, -0.4698238670825958, "In a very short time. You would have laughed to have seen what I saw yesterday. Emma did not know whether she was on her head or heels. In such a hurry to tell your great news."], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>In a very short time, you would have laughed to see what I saw yesterday. Emmet did not know whether she was on her head or heels in such a hurry to tell him great news.<|im_end|>", 0.6197176575660706, 0.4951137602329254, "In a very short time. You would have laughed to have seen what I saw yesterday. Emma did not know whether she was on her head or heels. In such a hurry to tell your great news."], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>In a very short time, you would have laughed to hear some of how I saw yesterday. Emmet did not know whether she was on her head or heels in such a hurry to tell your great news.<|im_end|>", 0.5412817597389221, -0.29783087968826294, "In a very short time. You would have laughed to have seen what I saw yesterday. Emma did not know whether she was on her head or heels. In such a hurry to tell your great news."], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>In a very short time, you would have laughed to listen to what I saw yesterday. 
Emmet did not know whether she was on her head or thumbs in such a hurry to tell your great news.<|im_end|>", 0.6698590517044067, 1.0020161867141724, "In a very short time. You would have laughed to have seen what I saw yesterday. Emma did not know whether she was on her head or heels. In such a hurry to tell your great news."], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>In a very short time, you would have laughed to your sin that I saw yesterday. Emmett did not know whether she was on her head or heels in such a hurry to tell him great news.<|im_end|>", 0.52790766954422, -0.4330357015132904, "In a very short time. You would have laughed to have seen what I saw yesterday. Emma did not know whether she was on her head or heels. In such a hurry to tell your great news."], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>In a very short time, you would have laughed to see what I saw yesterday. Emmet did not know whether she was on her head or heels in such a hurry to tell your great news.<|im_end|>", 0.693012535572052, 1.2360854148864746, "In a very short time. You would have laughed to have seen what I saw yesterday. Emma did not know whether she was on her head or heels. In such a hurry to tell your great news."], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>In a very short time, you would have laughed to see what I saw yesterday. Emmet did not know whether she was on her head or heels in such a hurry to tell your great news.<|im_end|>", 0.693012535572052, 1.2360854148864746, "In a very short time. You would have laughed to have seen what I saw yesterday. Emma did not know whether she was on her head or heels. 
In such a hurry to tell your great news."], ["650", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>In a very short time, you would have laughed to a sing of how I saw yesterday. Emmet did not know whether she was on her head or heels in such a hurry to tell your great news.<|im_end|>", 0.5417073369026184, -0.2935284972190857, "In a very short time. You would have laughed to have seen what I saw yesterday. Emma did not know whether she was on her head or heels. In such a hurry to tell your great news."]]}
wandb/run-20260418_172847-c2a5hfz3/files/media/table/completions_331_10c4aed0f625c56bd04d.table.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"columns": ["step", "prompt", "completion", "ASRWerSubLenCmpHalluDirtyV56", "advantages", "solution"], "data": [["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Captain marking, it's about about my wife. Polly answered, casting down her eyes and returning very red. The other gave a whistle.<|im_end|>", 0.5489940643310547, 0.10889305174350739, "Captain marker, it's about about my wife. Crawley answered, casting down his eyes and turning very red. The other gave a whistle."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Captain marten, it's about about my wife. Crawley answered, casting down his eyes and returning a very red. The other gave a whistle.<|im_end|>", 0.7004733681678772, 1.3730005025863647, "Captain marker, it's about about my wife. Crawley answered, casting down his eyes and turning very red. The other gave a whistle."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Captain marten, it's about about my wife. Crawley answered, casting down his eyes and returning a very red. The other day, the whistle.<|im_end|>", 0.4469512701034546, -0.7426625490188599, "Captain marker, it's about about my wife. Crawley answered, casting down his eyes and turning very red. The other gave a whistle."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Captain markham, it's about about my wife. Crawley answered, casting down his eyes and returning a very red. The other day, the whistle.<|im_end|>", 0.44736266136169434, -0.7392294406890869, "Captain marker, it's about about my wife. Crawley answered, casting down his eyes and turning very red. 
The other gave a whistle."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At evening upon the world, while others hint that knowledge of these might undo our civilization, there watched him ceaselessly from the underpits those eyes whose duty it is, from further within and deeper.<|im_end|>", 0.8165187239646912, -1.213279128074646, "At evening upon the world, while others hint that knowledge of these might undo our civilization, there watched him ceaselessly from the under pits, those eyes whose duty it is from further within and deeper."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At evening upon the world, while others hint that knowledge of these might undo our civilization, there watched him ceaselessly from the under pits those eyes whose duty it is from further within and deeper.<|im_end|>", 0.9336058497428894, 1.213279128074646, "At evening upon the world, while others hint that knowledge of these might undo our civilization, there watched him ceaselessly from the under pits, those eyes whose duty it is from further within and deeper."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At evening upon the world, while others hint that knowledge of these might undo our civilization, there watched him ceaselessly from the underpits those eyes whose duty it is from further within and deeper.<|im_end|>", 0.8821772933006287, 0.14745411276817322, "At evening upon the world, while others hint that knowledge of these might undo our civilization, there watched him ceaselessly from the under pits, those eyes whose duty it is from further within and deeper."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At evening upon the world, while others hint that 
knowledge of these might undo our civilization, there watched him ceaselessly from the under pits those eyes whose duty it is, from further within and deeper.<|im_end|>", 0.8679472804069519, -0.14745411276817322, "At evening upon the world, while others hint that knowledge of these might undo our civilization, there watched him ceaselessly from the under pits, those eyes whose duty it is from further within and deeper."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Milly steered her magnificent way like some great liner cleaving among the canoes of howling savages. Our goddess of grub was built on lines so majestic that they could be followed only with awe.<|im_end|>", 1.0, 0.0, "Milly steered her magnificent way like some great liner cleaving among the canoes of howling savages. Our goddess of grub was built on lines so majestic that they could be followed only with awe."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Milly steered her magnificent way like some great liner cleaving among the canoes of howling savages. Our goddess of grub was built on lines so majestic that they could be followed only with awe.<|im_end|>", 1.0, 0.0, "Milly steered her magnificent way like some great liner cleaving among the canoes of howling savages. Our goddess of grub was built on lines so majestic that they could be followed only with awe."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Milly steered her magnificent way like some great liner cleaving among the canoes of howling savages. Our goddess of grub was built on lines so majestic that they could be followed only with awe.<|im_end|>", 1.0, 0.0, "Milly steered her magnificent way like some great liner cleaving among the canoes of howling savages. 
Our goddess of grub was built on lines so majestic that they could be followed only with awe."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Milly steered her magnificent way like some great liner cleaving among the canoes of howling savages. Our goddess of grub was built on lines so majestic that they could be followed only with awe.<|im_end|>", 1.0, 0.0, "Milly steered her magnificent way like some great liner cleaving among the canoes of howling savages. Our goddess of grub was built on lines so majestic that they could be followed only with awe."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And make properly lavish time after working hard, it is not improbable that glossy buttons are a valid feature of the garb of a humdrum and harassed hospital portmanteau many intellect.<|im_end|>", 0.26788923144340515, -1.226920247077942, "And may properly lavish time and trouble thereupon. It is not arguable that glossy buttons are a valid feature of the garb of a humdrum and harassed hospital, orderly many a time."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And may properly lavish time and sport upon it is not improbable that glossy buttons are a valid feature of the garb of a humdrum and harassed hospital superintendent many intellect<|im_end|>", 0.4479951858520508, 1.2192050218582153, "And may properly lavish time and trouble thereupon. It is not arguable that glossy buttons are a valid feature of the garb of a humdrum and harassed hospital, orderly many a time."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And may properly lavish time after working hard. 
It is not improbable that glossy buttons are a valid feature of the garb of a humdrum and harassed hospital employee many intellect.<|im_end|>", 0.35821354389190674, -0.00017242900503333658, "And may properly lavish time and trouble thereupon. It is not arguable that glossy buttons are a valid feature of the garb of a humdrum and harassed hospital, orderly many a time."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And may properly lavish time and sport upon it is not improbable that glossy buttons are a valid feature of the garb of a humdrum and grassy hospital porter many intellect.<|im_end|>", 0.35880690813064575, 0.007886400446295738, "And may properly lavish time and trouble thereupon. It is not arguable that glossy buttons are a valid feature of the garb of a humdrum and harassed hospital, orderly many a time."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And Shahrazad perceived the dawn of day and ceased saying her permitted say, when it was the six hundred and seventy seventh night she pursued, it hath reached me o auspicious king that when the kafirs fell upon harib.<|im_end|>", 0.6396347880363464, 0.0463232584297657, "And shahrazad perceived the dawn of day and ceased saying her permitted say. When it was the six hundred and seventy seventh night, she pursued it. 
Hath reached me o auspicious king, that when the kafirs fell upon gharib."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And Shahrazad perceived the dawn of day and ceased saying her permitted say, when it was the six hundred and seventy seventh night she pursued, it hath reached me o auspicious king that when the kaffirs fell upon harib.<|im_end|>", 0.5678775310516357, -1.2670694589614868, "And shahrazad perceived the dawn of day and ceased saying her permitted say. When it was the six hundred and seventy seventh night, she pursued it. Hath reached me o auspicious king, that when the kafirs fell upon gharib."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And Shahrazad perceived the dawn of day and ceased saying her permitted say, when it was the six hundred and seventy seventh night, she pursued. It hath reached me, O auspicious king, that when the kafirs fell upon Harib.<|im_end|>", 0.7012686133384705, 1.1744240522384644, "And shahrazad perceived the dawn of day and ceased saying her permitted say. When it was the six hundred and seventy seventh night, she pursued it. Hath reached me o auspicious king, that when the kafirs fell upon gharib."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And Shahrazad perceived the dawn of day and ceased saying her permitted say, when it was the six hundred and seventy seventh night she pursued. It hath reached me o auspicious king that when the kafirs fell upon harib.<|im_end|>", 0.6396347880363464, 0.0463232584297657, "And shahrazad perceived the dawn of day and ceased saying her permitted say. When it was the six hundred and seventy seventh night, she pursued it. 
Hath reached me o auspicious king, that when the kafirs fell upon gharib."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>these he would make reply but was from a certain person whom perhaps we need not name then the whiskey bottle would move forward like a pawn in chess and the next soothing words would be<|im_end|>", 0.8178245425224304, 0.502872109413147, "deasey would make reply but twas from a certain person whom perhaps we need not name then the whiskey bottle would move forward like a pawn in chess and the next soothing words would be"], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>beasy would make reply but was from a certain person whom perhaps we need not name then the whiskey bottle would move forward like a pawn in chess and the next soothing words would be<|im_end|>", 0.8717525601387024, 0.8038002252578735, "deasey would make reply but twas from a certain person whom perhaps we need not name then the whiskey bottle would move forward like a pawn in chess and the next soothing words would be"], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>these he would make reply but was from a certain person whom perhaps we need not name then the whiskey bottle would move forward like upon in chest and the next soothing words repeat<|im_end|>", 0.4692924916744232, -1.4420000314712524, "deasey would make reply but twas from a certain person whom perhaps we need not name then the whiskey bottle would move forward like a pawn in chess and the next soothing words would be"], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>these he would make reply but was from a certain person whom perhaps we need not name then the whiskey bottle would move forward like a pawn in 
chess and the next suiting words would be<|im_end|>", 0.7519586086273193, 0.13532821834087372, "deasey would make reply but twas from a certain person whom perhaps we need not name then the whiskey bottle would move forward like a pawn in chess and the next soothing words would be"], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He did, in fact, begin it when setting out on the aforementioned second trip to Europe, calling it.<|im_end|>", 1.0, 0.49922850728034973, "He did, in fact, begin it when setting out on the aforementioned second trip to europe, calling it."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He did, in fact, begin it when setting out on the aforementioned second trip to Europe, calling it.<|im_end|>", 1.0, 0.49922850728034973, "He did, in fact, begin it when setting out on the aforementioned second trip to europe, calling it."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He did, in fact, begin it when setting out on the aforementioned second trip to Europe, calling it.<|im_end|>", 1.0, 0.49922850728034973, "He did, in fact, begin it when setting out on the aforementioned second trip to europe, calling it."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He did, in fact begin it when setting out on the aforementioned second trip to Europe, calling it.<|im_end|>", 0.8706542253494263, -1.4976837635040283, "He did, in fact, begin it when setting out on the aforementioned second trip to europe, calling it."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Bayard knew that his master was upon him, and he started off upon a rapid pace. 
And in a few moments, he had good run up. Malagigi pretended to be in great alarm. O noble king and master, he cried, my poor companion has run away with. He will fall and break his neck.<|im_end|>", 0.4922104775905609, -0.6293519735336304, "Bayard knew that his master was upon him, and he started off upon a rapid pace, and in a few moments was a good way off. Malagigi pretended to be in great alarm o, noble king and master. He cried, my poor companion is run away with he will fall and break his neck."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Bayard knew that his master was upon him, and he started off upon a rapid pace. And in a few moments, he had galloped away. Malagigi pretended to be in great alarm. O noble king and master, he cried, my poor companion has run away with me. He will fall and break his neck.<|im_end|>", 0.4565129280090332, -1.024836540222168, "Bayard knew that his master was upon him, and he started off upon a rapid pace, and in a few moments was a good way off. Malagigi pretended to be in great alarm o, noble king and master. He cried, my poor companion is run away with he will fall and break his neck."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Bayard knew that his master was upon him, and he started off upon a rapid pace. And in a few moments of a good way up. Malagigi pretended to be in great alarm. O noble king and master, he cried, my poor companion has run away with. He will fall and break his neck.<|im_end|>", 0.6506629586219788, 1.1261051893234253, "Bayard knew that his master was upon him, and he started off upon a rapid pace, and in a few moments was a good way off. Malagigi pretended to be in great alarm o, noble king and master. 
He cried, my poor companion is run away with he will fall and break his neck."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Bayard knew that his master was upon him, and he started off upon a rapid pace. And in a few moments of a good run up, Malagigi pretended to be in great alarm. O noble king and master, he cried, my poor companion has run away with. He will fall and break his neck.<|im_end|>", 0.5966837406158447, 0.5280823707580566, "Bayard knew that his master was upon him, and he started off upon a rapid pace, and in a few moments was a good way off. Malagigi pretended to be in great alarm o, noble king and master. He cried, my poor companion is run away with he will fall and break his neck."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>She laid a firm, delicate hand on her gold green jerkin. Ellador, this was pleasant, but we got no nearer. We can't sit here and learn the language. Terry protested.<|im_end|>", 1.0, 1.3054163455963135, "She laid a firm, delicate hand on her gold green jerkin. Ellador, this was pleasant, but we got no nearer. We can't sit here and learn the language. Terry protested."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>She laid a firm, delicate hand on her gold green jerkin ellador. This was pleasant, but we got no nearer. We can't sit here and learn the language. Terry protested.<|im_end|>", 0.8441234230995178, -0.7815061807632446, "She laid a firm, delicate hand on her gold green jerkin. Ellador, this was pleasant, but we got no nearer. We can't sit here and learn the language. Terry protested."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>She laid a firm, delicate hand on her gold green jerkin. Ellador. 
This was pleasant, but we got no nearer. We can't sit here and learn the language. Terry protested.<|im_end|>", 0.9217362999916077, 0.2575983703136444, "She laid a firm, delicate hand on her gold green jerkin. Ellador, this was pleasant, but we got no nearer. We can't sit here and learn the language. Terry protested."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>She laid a firm, delicate hand on her gold green jerkin ellador. This was pleasant, but we got no nearer. We can't sit here and learn the language. Terry protested.<|im_end|>", 0.8441234230995178, -0.7815061807632446, "She laid a firm, delicate hand on her gold green jerkin. Ellador, this was pleasant, but we got no nearer. We can't sit here and learn the language. Terry protested."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>he cried out sadly and fought and struggled two minutes however he did little against his tormentors and worn out with his struggle plats suddenly went from dusty boy with emotion in his spirit lost lost he muttered all lost<|im_end|>", -0.15980112552642822, -0.0070180995389819145, "he cried out savagely and fought with the strength of two men however he could do little against his four adversaries and worn out with the struggle collapsed suddenly on to the dusty floor with a motion of despair lost lost he muttered all lost"], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>he cried out sadly and fought and struggled two minutes however he did little against his tormentors and worn out with his struggle platt suddenly on the dusty floor with emotion in his spirit lost lost he muttered all lost<|im_end|>", 0.03230888023972511, 0.7638584971427917, "he cried out savagely and fought with the strength of two men however he could do little against his four 
adversaries and worn out with the struggle collapsed suddenly on to the dusty floor with a motion of despair lost lost he muttered all lost"], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>he cried out sadly and fought and struggled to win it however he did little against his tormentors and wore down with his struggle plaid suddenly went from dusty boy with emotion in his spirit lost, lost, he muttered all lost<|im_end|>", -0.5093984603881836, -1.409841537475586, "he cried out savagely and fought with the strength of two men however he could do little against his four adversaries and worn out with the struggle collapsed suddenly on to the dusty floor with a motion of despair lost lost he muttered all lost"], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>he cried out sadly and fought and struggled two minutes however he did little against four adversaries and worn out with his struggle clapp suddenly on the dusty floor in motionless terror lost lost he muttered all lost<|im_end|>", 0.004682107362896204, 0.653001070022583, "he cried out savagely and fought with the strength of two men however he could do little against his four adversaries and worn out with the struggle collapsed suddenly on to the dusty floor with a motion of despair lost lost he muttered all lost"], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>and thus he accomplished this by the bye during the siege of the city, for he had his enemies in great contempt already nine when he had thus married mariamne.<|im_end|>", 0.715508222579956, 0.49875012040138245, "And thus he accomplished this by the by, during the siege of the city. 
For he had his enemies in great contempt already nine when he had thus married mariamne, he."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>and thus he accomplished this by the bye during the siege of the city, for he had his enemies in great contempt already nine when he had thus married mariamne.<|im_end|>", 0.715508222579956, 0.49875012040138245, "And thus he accomplished this by the by, during the siege of the city. For he had his enemies in great contempt already nine when he had thus married mariamne, he."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And thus he accomplished this by the bye during the siege of the city, for he had his enemies in great contempt already. Nine when he had thus married Mariamne.<|im_end|>", 0.6356512308120728, -1.4962533712387085, "And thus he accomplished this by the by, during the siege of the city. For he had his enemies in great contempt already nine when he had thus married mariamne, he."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>and thus he accomplished this by the bye during the siege of the city, for he had his enemies in great contempt already nine when he had thus married mariamne.<|im_end|>", 0.715508222579956, 0.49875012040138245, "And thus he accomplished this by the by, during the siege of the city. For he had his enemies in great contempt already nine when he had thus married mariamne, he."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Putting both hands on her shoulders and looking into the brown eyes, should you be willing to go abroad with your mother and phronsie? 
Mister king and jasper oh polly gasped but you.<|im_end|>", 0.7173033952713013, -0.7722386121749878, "Putting both hands on her shoulders and looking into the brown eyes, should you be willing to go abroad with your mother and phronsie, mister king and jasper? Oh, polly gasped, but you."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Putting both hands on her shoulders and looking into the brown eyes, should you be willing to go abroad with your mother and phronsie? Mister king and jasper. Oh Polly gasped. But you.<|im_end|>", 0.7161594033241272, -0.7890278100967407, "Putting both hands on her shoulders and looking into the brown eyes, should you be willing to go abroad with your mother and phronsie, mister king and jasper? Oh, polly gasped, but you."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Putting both hands on her shoulders and looking into the brown eyes, should you be willing to go abroad with your mother and phronsie? Mister king and jasper. Oh Polly gasped, but you.<|im_end|>", 0.7872677445411682, 0.25455793738365173, "Putting both hands on her shoulders and looking into the brown eyes, should you be willing to go abroad with your mother and phronsie, mister king and jasper? Oh, polly gasped, but you."], ["660", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Putting both hands on her shoulders and looking into the brown eyes, should you be willing to go abroad with your mother and phronsie, mister king and jasper? Oh Polly gasped but you.<|im_end|>", 0.8589596152305603, 1.3067076206207275, "Putting both hands on her shoulders and looking into the brown eyes, should you be willing to go abroad with your mother and phronsie, mister king and jasper? Oh, polly gasped, but you."]]}
wandb/run-20260418_172847-c2a5hfz3/files/media/table/completions_335_3461640c297d6819a123.table.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"columns": ["step", "prompt", "completion", "ASRWerSubLenCmpHalluDirtyV56", "advantages", "solution"], "data": [["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Are any other beings ever found in such masses but armor, anus, scaly and naked? Look at them.<|im_end|>", 0.10128102451562881, 0.9727044701576233, "Are any other beings ever found in such masses? But vermin, aimless, staring, vacant minded. Look at them."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Are any other beings ever found in such masses of iron, anus, stone and great granite? Look at them.<|im_end|>", -0.21537110209465027, -0.9686115980148315, "Are any other beings ever found in such masses? But vermin, aimless, staring, vacant minded. Look at them."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Are any other beings ever found in such masses but armor, anus, scale and great and round? Look at them.<|im_end|>", -0.17419415712356567, -0.7161659002304077, "Are any other beings ever found in such masses? But vermin, aimless, staring, vacant minded. Look at them."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Are any other beings ever found in such masses but iron, a mis, stone? Great and grand. Look at them.<|im_end|>", -0.16917581856250763, -0.6853997111320496, "Are any other beings ever found in such masses? But vermin, aimless, staring, vacant minded. Look at them."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Are any other beings ever found in such masses of iron, anus, stone and great granite? 
Look at them.<|im_end|>", -0.21537110209465027, -0.9686115980148315, "Are any other beings ever found in such masses? But vermin, aimless, staring, vacant minded. Look at them."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Are any other beings ever found in such masses, but armor? Anus, scaly and naked. Look at them.<|im_end|>", 0.10200562328100204, 0.9771468043327332, "Are any other beings ever found in such masses? But vermin, aimless, staring, vacant minded. Look at them."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Are any other beings ever found in such masses, but armor, anus, scale and great and round it? Look at them.<|im_end|>", -0.35615864396095276, -1.8317453861236572, "Are any other beings ever found in such masses? But vermin, aimless, staring, vacant minded. Look at them."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Are any other beings ever found in such masses but armor, anus, scaly and naked? Look at them.<|im_end|>", 0.10128102451562881, 0.9727044701576233, "Are any other beings ever found in such masses? But vermin, aimless, staring, vacant minded. Look at them."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Are any other beings ever found in such masses but armor, anus, stamen and great gland? Look at them.<|im_end|>", -0.035287097096443176, 0.13543902337551117, "Are any other beings ever found in such masses? But vermin, aimless, staring, vacant minded. Look at them."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Are any other beings ever found in such masses but armor, anus, scaly and naked minded? 
Look at them.<|im_end|>", -0.028729775920510292, 0.17564034461975098, "Are any other beings ever found in such masses? But vermin, aimless, staring, vacant minded. Look at them."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Are any other beings ever found in such masses but armor anus, scaly and naked? Look at them.<|im_end|>", 0.09989295154809952, 0.9641945362091064, "Are any other beings ever found in such masses? But vermin, aimless, staring, vacant minded. Look at them."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Are any other beings ever found in such masses but armor, anus, scaly and naked? Look at them.<|im_end|>", 0.10128102451562881, 0.9727044701576233, "Are any other beings ever found in such masses? But vermin, aimless, staring, vacant minded. Look at them."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>in which both of them seated without either audience for nothing had been said on either side between them to slight each other less than they had done before and elizabeth asked her parting with a melancholy persuasion that edward was not only without affection for the person who was to be his bride<|im_end|>", 0.2575233578681946, 0.4609338343143463, "to which both of them submitted without any reluctance for nothing had been said on either side to make them dislike each other less than they had done before and elinor sat down to the card table with the melancholy persuasion that edward was not only without affection for the person who was to be his wife"], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>in which both of them seated without either audience for nothing it could be said on either side that they disliked each other less than 
they had done before and elizabeth asked for parting with a melancholy persuasion that edward was not only without affection for the person who was to be his bride<|im_end|>", 0.1251828372478485, -1.8440135717391968, "to which both of them submitted without any reluctance for nothing had been said on either side to make them dislike each other less than they had done before and elinor sat down to the card table with the melancholy persuasion that edward was not only without affection for the person who was to be his wife"], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>in which both of them seated without either audience for nothing it can say on either side had made them dislike each other less than they had done before and elizabeth asked her partake with a melancholy persuasion that edward was not only without affection for the person who was his wife<|im_end|>", 0.17267856001853943, -1.0167903900146484, "to which both of them submitted without any reluctance for nothing had been said on either side to make them dislike each other less than they had done before and elinor sat down to the card table with the melancholy persuasion that edward was not only without affection for the person who was to be his wife"], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>in which both of them sitted without either utterance for nothing had been said on either side except from dislike each other less than they had done before and elizabeth asked her partaker with a melancholy persuasion that edward was not only without affection for the person who was speaking his mind<|im_end|>", 0.21673797070980072, -0.249416783452034, "to which both of them submitted without any reluctance for nothing had been said on either side to make them dislike each other less than they had done before and elinor sat down to the card table with the 
melancholy persuasion that edward was not only without affection for the person who was to be his wife"], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>in which both of them seated without either audience for nothing had been said on either side except from dislike each other less than they had done before and elizabeth asked her parting with a melancholy persuasion that edward was not only without affection for the person who was his wife<|im_end|>", 0.26496413350105286, 0.5905282497406006, "to which both of them submitted without any reluctance for nothing had been said on either side to make them dislike each other less than they had done before and elinor sat down to the card table with the melancholy persuasion that edward was not only without affection for the person who was to be his wife"], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>in which both of them seated without either audience for nothing it could said on either side made them dislike each other less than they had done before and elizabeth asked for parting with a melancholy persuasion that edward was not only without affection for the person who was to be his bride<|im_end|>", 0.26157763600349426, 0.5315463542938232, "to which both of them submitted without any reluctance for nothing had been said on either side to make them dislike each other less than they had done before and elinor sat down to the card table with the melancholy persuasion that edward was not only without affection for the person who was to be his wife"], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>in which both of them seated without either audience for nothing it had said on either side made them dislike each other less than they had done before and elizabeth asked her partaking with a 
melancholy persuasion that edward was not only without affection for the person who was to be his bride<|im_end|>", 0.26304858922958374, 0.5571656227111816, "to which both of them submitted without any reluctance for nothing had been said on either side to make them dislike each other less than they had done before and elinor sat down to the card table with the melancholy persuasion that edward was not only without affection for the person who was to be his wife"], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>in which both of them succeeded without either arguments for nothing it had said on either side could make them dislike each other less than they had done before and elizabeth asked her parting with a melancholy resiliation that edward was not only without affection for the person who was keeping his mind<|im_end|>", 0.1625610888004303, -1.1930042505264282, "to which both of them submitted without any reluctance for nothing had been said on either side to make them dislike each other less than they had done before and elinor sat down to the card table with the melancholy persuasion that edward was not only without affection for the person who was to be his wife"], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>in which both of them seated without either audience for nothing had been said on either side except in dislike each other less than they had done before and elizabeth asked her partake with a melancholy persuasion that edward was not only without affection for the person who was to be his bride<|im_end|>", 0.30962347984313965, 1.368350863456726, "to which both of them submitted without any reluctance for nothing had been said on either side to make them dislike each other less than they had done before and elinor sat down to the card table with the melancholy persuasion that edward was not only 
without affection for the person who was to be his wife"], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>in which both of them sitted without either audience for nothing had been said on either side except what was like each other less than they had done before and elizabeth asked her partaking with a melancholy persuasion that edward was not only without affection for the person who was his wife<|im_end|>", 0.21824409067630768, -0.2231850028038025, "to which both of them submitted without any reluctance for nothing had been said on either side to make them dislike each other less than they had done before and elinor sat down to the card table with the melancholy persuasion that edward was not only without affection for the person who was to be his wife"], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>in which both of them seated without either audience for nothing had been said on either side except from dislike each other less than they had done before nelly lost asked to partake with a melancholy persuasion that edward was not only without affection for the person who was to be his bride<|im_end|>", 0.30912715196609497, 1.3597064018249512, "to which both of them submitted without any reluctance for nothing had been said on either side to make them dislike each other less than they had done before and elinor sat down to the card table with the melancholy persuasion that edward was not only without affection for the person who was to be his wife"], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>in which both of them succeeded without either audience for nothing had been said on either side between the sight each other less than they had done before and elizabeth asked her parting with a melancholy resiliation that edward was not only 
without affection for the person who was to be his bride<|im_end|>", 0.2114323079586029, -0.34182441234588623, "to which both of them submitted without any reluctance for nothing had been said on either side to make them dislike each other less than they had done before and elinor sat down to the card table with the melancholy persuasion that edward was not only without affection for the person who was to be his wife"], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And they've just been ordered a small pot of ginger, then please, said Barbara quickly. Will you send it round immediately? Yes, ma'am. The boy's just going out. Thank you, ma'am.<|im_end|>", 0.4192619323730469, 1.2368416786193848, "And they've just been ordered a small pot of ginger then, please, said diva, recklessly. Will you send it round immediately? Yes, ma'am. The boy's just going out. That was luck."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And they've just been ordered a small pot of ginger, then please. Without a requisition. Will you send it round immediately? Yes, ma'am. The boys just going out. That's what.<|im_end|>", 0.15900462865829468, -0.6233274340629578, "And they've just been ordered a small pot of ginger then, please, said diva, recklessly. Will you send it round immediately? Yes, ma'am. The boy's just going out. That was luck."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And they've just been ordered a small pot of ginger then, please, if I'd rather have it sweet? Will you send it round immediately? Yes, ma'am. The boy's just going out. That'll be about.<|im_end|>", 0.27937445044517517, 0.23700663447380066, "And they've just been ordered a small pot of ginger then, please, said diva, recklessly. Will you send it round immediately? Yes, ma'am. 
The boy's just going out. That was luck."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And they've just been ordered a small pot of ginger, then please, said Datterley softly. Will you send it round immediately? Yes, ma'am. The boys just going out. Thank you, mother.<|im_end|>", 0.32857972383499146, 0.5886975526809692, "And they've just been ordered a small pot of ginger then, please, said diva, recklessly. Will you send it round immediately? Yes, ma'am. The boy's just going out. That was luck."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And that's just been ordered a small pot of ginger, then please, without a requisition. Will you send it round immediately? Yes, ma'am. The boys just going out. That is well.<|im_end|>", 0.22822655737400055, -0.12856899201869965, "And they've just been ordered a small pot of ginger then, please, said diva, recklessly. Will you send it round immediately? Yes, ma'am. The boy's just going out. That was luck."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And they've just been ordered a small pot of ginger, then please. I'd rather have it soon. Will you send it round immediately? Yes, ma'am. The boy's just going out. Thank you, ma'am.<|im_end|>", 0.08186985552310944, -1.1746423244476318, "And they've just been ordered a small pot of ginger then, please, said diva, recklessly. Will you send it round immediately? Yes, ma'am. The boy's just going out. That was luck."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And they've just been ordered a small pot of ginger, then please said datterley quickly. Will you send it round immediately? Yes, ma'am. The boy's just going out. Thank you. 
Well.<|im_end|>", 0.33202850818634033, 0.6133474707603455, "And they've just been ordered a small pot of ginger then, please, said diva, recklessly. Will you send it round immediately? Yes, ma'am. The boy's just going out. That was luck."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And that's just been ordered a small pot of ginger, then please. What about a recipe? Will you send it round immediately? Yes, ma'am. The boys just going out. Thank you. Well.<|im_end|>", -0.03146732226014137, -1.9847110509872437, "And they've just been ordered a small pot of ginger then, please, said diva, recklessly. Will you send it round immediately? Yes, ma'am. The boy's just going out. That was luck."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And they've just been ordered a small pot of ginger, then please if that'll reconcile. Will you send it round immediately? Yes, ma'am. The boy's just going out. Thank you, ma'am.<|im_end|>", 0.23466002941131592, -0.08258624374866486, "And they've just been ordered a small pot of ginger then, please, said diva, recklessly. Will you send it round immediately? Yes, ma'am. The boy's just going out. That was luck."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And that's just been ordered a small pot of ginger, then please without a recipe. Will you send it round immediately? Yes, ma'am. The boy's just going out. Thank you, papa.<|im_end|>", 0.14090721309185028, -0.752677321434021, "And they've just been ordered a small pot of ginger then, please, said diva, recklessly. Will you send it round immediately? Yes, ma'am. The boy's just going out. 
That was luck."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And they've just been ordered a small pot of ginger, then please, said the doctor rapidly. Will you send it round immediately? Yes, ma'am, the boy's just going out. That is well.<|im_end|>", 0.34315091371536255, 0.692844033241272, "And they've just been ordered a small pot of ginger then, please, said diva, recklessly. Will you send it round immediately? Yes, ma'am. The boy's just going out. That was luck."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And they've just been ordered a small pot of ginger, then please, said datterley hastily. Will you send it round immediately? Yes, ma'am. The boy's just going out. That's well.<|im_end|>", 0.4389801323413849, 1.377776026725769, "And they've just been ordered a small pot of ginger then, please, said diva, recklessly. Will you send it round immediately? Yes, ma'am. The boy's just going out. That was luck."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I don't want to be you, for I am not, and yet there is one thing that I forbear to mourn them.<|im_end|>", -1.3294343948364258, -1.4924614429473877, "You don't believe it, do you? Watson, no, no. And yet, it was one thing to laugh about it in london."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He demanded, \"Do you have a hat?\". I had one, and yet there was one thing that I forgot to mention.<|im_end|>", -1.2909154891967773, -1.3791276216506958, "You don't believe it, do you? Watson, no, no. 
And yet, it was one thing to laugh about it in london."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He declared to you, of course, I am here and yet there is one thing to laugh about in London.<|im_end|>", -0.8068205714225769, 0.04522077739238739, "You don't believe it, do you? Watson, no, no. And yet, it was one thing to laugh about it in london."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He did not believe it, and yet there was one thing to laugh about in London.<|im_end|>", -0.3995647430419922, 1.2434861660003662, "You don't believe it, do you? Watson, no, no. And yet, it was one thing to laugh about it in london."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He thought, but he knew of it all, and yet there was one thing to laugh about in London.<|im_end|>", -0.6124812364578247, 0.617023766040802, "You don't believe it, do you? Watson, no, no. And yet, it was one thing to laugh about it in london."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He declared, be you what you will and yet there is one thing to laugh about it in London.<|im_end|>", -0.6049650311470032, 0.6391386389732361, "You don't believe it, do you? Watson, no, no. And yet, it was one thing to laugh about it in london."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He declared to you, he said, I am ill, and yet there is one thing to laugh about in London.<|im_end|>", -0.807164192199707, 0.04420974478125572, "You don't believe it, do you? Watson, no, no. 
And yet, it was one thing to laugh about it in london."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He replied, but do you want to help me in that? And yet there is one thing to laugh about it in London.<|im_end|>", -0.9126564264297485, -0.2661791741847992, "You don't believe it, do you? Watson, no, no. And yet, it was one thing to laugh about it in london."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He had been a victim of hope, and yet there was one thing to laugh about it in London.<|im_end|>", -0.4558258652687073, 1.0779495239257812, "You don't believe it, do you? Watson, no, no. And yet, it was one thing to laugh about it in london."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He complained, but he was hotly in love. And yet there is one thing that I forgot to mention.<|im_end|>", -1.290951132774353, -1.3792325258255005, "You don't believe it, do you? Watson, no, no. And yet, it was one thing to laugh about it in london."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He declared, \"Do you think I am ill? And yet there is one thing to laugh about in London.\"<|im_end|>", -0.9214498996734619, -0.29205214977264404, "You don't believe it, do you? Watson, no, no. And yet, it was one thing to laugh about it in london."], ["670", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I don't believe you, sir. I know it, and yet there is one thing to laugh about in London.<|im_end|>", -0.434049129486084, 1.1420230865478516, "You don't believe it, do you? Watson, no, no. And yet, it was one thing to laugh about it in london."]]}
wandb/run-20260418_172847-c2a5hfz3/files/media/table/completions_411_885808c4b4bd708583eb.table.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"columns": ["step", "prompt", "completion", "ASRWerSubLenCmpHalluDirtyV56", "advantages", "solution"], "data": [["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Captain markham, it's about about my wife. Polly answered, casting down her eyes and returning a very red. The other day, the whistle.<|im_end|>", 0.1822807341814041, -0.6647002696990967, "Captain marker, it's about about my wife. Crawley answered, casting down his eyes and turning very red. The other gave a whistle."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Captain martin, it's about about my wife, crawley answered, casting down his eyes and returning a very red. The other day, the whistle.<|im_end|>", 0.3173089027404785, -0.11428264528512955, "Captain marker, it's about about my wife. Crawley answered, casting down his eyes and turning very red. The other gave a whistle."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Captain marten, it's about about my wife. Crawley answered, casting down his eyes and returning a very red. The other gave a whistle.<|im_end|>", 0.7004733681678772, 1.4476171731948853, "Captain marker, it's about about my wife. Crawley answered, casting down his eyes and turning very red. The other gave a whistle."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Captain martin, it's about about my wife. Polly answered, casting down her eyes and returning a very red. The other day, the whistle.<|im_end|>", 0.1813155859708786, -0.6686345338821411, "Captain marker, it's about about my wife. Crawley answered, casting down his eyes and turning very red. 
The other gave a whistle."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At evening upon the world, while others hint that knowledge of these might undo our civilization. There watched him ceaselessly from the underpits those eyes whose duty it is from further within and deeper.<|im_end|>", 0.8152623176574707, -1.2966564893722534, "At evening upon the world, while others hint that knowledge of these might undo our civilization, there watched him ceaselessly from the under pits, those eyes whose duty it is from further within and deeper."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At evening upon the world, while others hint that knowledge of these might undo our civilization, there watched him ceaselessly from the under pits those eyes whose duty it is from further within and deeper.<|im_end|>", 0.9336058497428894, 1.1373971700668335, "At evening upon the world, while others hint that knowledge of these might undo our civilization, there watched him ceaselessly from the under pits, those eyes whose duty it is from further within and deeper."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At evening upon the world, while others hint that knowledge of these might undo our civilization, there watched him ceaselessly from the underpits those eyes whose duty it is from further within and deeper.<|im_end|>", 0.8821772933006287, 0.0796302929520607, "At evening upon the world, while others hint that knowledge of these might undo our civilization, there watched him ceaselessly from the under pits, those eyes whose duty it is from further within and deeper."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>At evening upon the world, while others hint that 
knowledge of these might undo our civilization, there watched him ceaselessly from the underpits those eyes whose duty it is from further within and deeper.<|im_end|>", 0.8821772933006287, 0.0796302929520607, "At evening upon the world, while others hint that knowledge of these might undo our civilization, there watched him ceaselessly from the under pits, those eyes whose duty it is from further within and deeper."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Milly steered her magnificent way like some great liner cleaving among the canoes of howling savages. Our goddess of grub was built on lines so majestic that they could be followed only with awe.<|im_end|>", 1.0, 0.0, "Milly steered her magnificent way like some great liner cleaving among the canoes of howling savages. Our goddess of grub was built on lines so majestic that they could be followed only with awe."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Milly steered her magnificent way like some great liner cleaving among the canoes of howling savages. Our goddess of grub was built on lines so majestic that they could be followed only with awe.<|im_end|>", 1.0, 0.0, "Milly steered her magnificent way like some great liner cleaving among the canoes of howling savages. Our goddess of grub was built on lines so majestic that they could be followed only with awe."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Milly steered her magnificent way like some great liner cleaving among the canoes of howling savages. Our goddess of grub was built on lines so majestic that they could be followed only with awe.<|im_end|>", 1.0, 0.0, "Milly steered her magnificent way like some great liner cleaving among the canoes of howling savages. 
Our goddess of grub was built on lines so majestic that they could be followed only with awe."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Milly steered her magnificent way like some great liner cleaving among the canoes of howling savages. Our goddess of grub was built on lines so majestic that they could be followed only with awe.<|im_end|>", 1.0, 0.0, "Milly steered her magnificent way like some great liner cleaving among the canoes of howling savages. Our goddess of grub was built on lines so majestic that they could be followed only with awe."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And may properly lavish time and store it upon. It is not improbable that glossy buttons are a valid feature of the garb of a humdrum and harassed hospital porter many intellect.<|im_end|>", 0.38166147470474243, 0.8561707735061646, "And may properly lavish time and trouble thereupon. It is not arguable that glossy buttons are a valid feature of the garb of a humdrum and harassed hospital, orderly many a time."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And may properly lavish time and reward him upon it is not improbable that glossy buttons are a valid feature of the garb of a humdrum and grassy hospital porter many intellect.<|im_end|>", 0.2887856066226959, 0.24522322416305542, "And may properly lavish time and trouble thereupon. 
It is not arguable that glossy buttons are a valid feature of the garb of a humdrum and harassed hospital, orderly many a time."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And may properly lavish time and store their money in it is not improbable that glossy buttons are a valid feature of the garb of a humdrum and harassed hospital portmanteau many intellect.<|im_end|>", 0.30360567569732666, 0.3427112400531769, "And may properly lavish time and trouble thereupon. It is not arguable that glossy buttons are a valid feature of the garb of a humdrum and harassed hospital, orderly many a time."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And may properly lavish time at his work of art. It is not improbable that glossy buttons are a valid feature in the garb of a humdrum and grassy hospital wardrobes many intellect.<|im_end|>", 0.031974904239177704, -1.4441053867340088, "And may properly lavish time and trouble thereupon. It is not arguable that glossy buttons are a valid feature of the garb of a humdrum and harassed hospital, orderly many a time."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And shahrazad perceived the dawn of day and ceased saying her permitted say, when it was the six hundred and seventy seventh night she pursued, it hath reached me o auspicious king that when the kafirs fell upon harib.<|im_end|>", 0.6396347880363464, -0.8913764357566833, "And shahrazad perceived the dawn of day and ceased saying her permitted say. When it was the six hundred and seventy seventh night, she pursued it. 
Hath reached me o auspicious king, that when the kafirs fell upon gharib."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And shahrazad perceived the dawn of day and ceased saying her permitted say, when it was the six hundred and seventy seventh night, she pursued it hath reached me o auspicious king that when the kafirs fell upon harib.<|im_end|>", 0.7608726620674133, 1.3088793754577637, "And shahrazad perceived the dawn of day and ceased saying her permitted say. When it was the six hundred and seventy seventh night, she pursued it. Hath reached me o auspicious king, that when the kafirs fell upon gharib."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And shahrazad perceived the dawn of day and ceased saying her permitted say when it was the six hundred and seventy seventh night, she pursued. It hath reached me o auspicious king that when the kafirs fell upon harib.<|im_end|>", 0.7017130255699158, 0.23523521423339844, "And shahrazad perceived the dawn of day and ceased saying her permitted say. When it was the six hundred and seventy seventh night, she pursued it. Hath reached me o auspicious king, that when the kafirs fell upon gharib."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And Shahrazad perceived the dawn of day and ceased saying her permitted say when it was the six hundred seventy seventh night, she pursued it hath reached me o auspicious king that when the kaffirs fell upon harib.<|im_end|>", 0.6527841091156006, -0.6527392268180847, "And shahrazad perceived the dawn of day and ceased saying her permitted say. When it was the six hundred and seventy seventh night, she pursued it. 
Hath reached me o auspicious king, that when the kafirs fell upon gharib."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>these he would make reply but was from a certain person whom perhaps we need not name then the whiskey bottle would move forward like a pawn in chess and the next suited words would be<|im_end|>", 0.74958735704422, 0.16212931275367737, "deasey would make reply but twas from a certain person whom perhaps we need not name then the whiskey bottle would move forward like a pawn in chess and the next soothing words would be"], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>these he would make reply, but was found on a certain person whom perhaps we need not name. Then the whiskey bottle would move forward like a pawn in chess and the next soothing words would be<|im_end|>", 0.5462133884429932, -1.4572458267211914, "deasey would make reply but twas from a certain person whom perhaps we need not name then the whiskey bottle would move forward like a pawn in chess and the next soothing words would be"], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>these he would make reply but was from a certain person whom perhaps we need not name then the whiskey bottle would move forward like a pawn in chess and the next soothing words would be<|im_end|>", 0.8178245425224304, 0.7054712176322937, "deasey would make reply but twas from a certain person whom perhaps we need not name then the whiskey bottle would move forward like a pawn in chess and the next soothing words would be"], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>easy would make reply but was from a certain person whom perhaps we need not name then the whiskey bottle would move forward like a 
pawn in chess and the next suited words would be<|im_end|>", 0.8032783269882202, 0.5896462798118591, "deasey would make reply but twas from a certain person whom perhaps we need not name then the whiskey bottle would move forward like a pawn in chess and the next soothing words would be"], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He did in fact begin it when setting out on the aforementioned second trip to europe, calling it.<|im_end|>", 0.7412750124931335, 0.0, "He did, in fact, begin it when setting out on the aforementioned second trip to europe, calling it."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He did in fact begin it when setting out on the aforementioned second trip to europe, calling it.<|im_end|>", 0.7412750124931335, 0.0, "He did, in fact, begin it when setting out on the aforementioned second trip to europe, calling it."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He did in fact begin it when setting out on the aforementioned second trip to europe, calling it.<|im_end|>", 0.7412750124931335, 0.0, "He did, in fact, begin it when setting out on the aforementioned second trip to europe, calling it."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>He did in fact begin it when setting out on the aforementioned second trip to Europe, calling it.<|im_end|>", 0.7412750124931335, 0.0, "He did, in fact, begin it when setting out on the aforementioned second trip to europe, calling it."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Fayard knew that his master was upon him, and he started off upon a rapid pace. And in a few moments, he had ridden on. 
Malagigi pretended to be in great alarm. O noble king and master, he cried, my poor companion has run away with me. He will fall and break his neck.<|im_end|>", 0.40350231528282166, 0.19367654621601105, "Bayard knew that his master was upon him, and he started off upon a rapid pace, and in a few moments was a good way off. Malagigi pretended to be in great alarm o, noble king and master. He cried, my poor companion is run away with he will fall and break his neck."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Veyard knew that his master was upon him, and he started off upon a rapid pace. And in a few moments, he had got well up. Malagigi pretended to be in great alarm. O noble king and master, he cried, my poor companion has run away with me. He will fall and break his neck.<|im_end|>", 0.3942375183105469, -0.0513581745326519, "Bayard knew that his master was upon him, and he started off upon a rapid pace, and in a few moments was a good way off. Malagigi pretended to be in great alarm o, noble king and master. He cried, my poor companion is run away with he will fall and break his neck."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Bayard knew that his master was upon him, and he started off upon a rapid pace. And in a few moments, he had got well up. Malagigi pretended to be in great alarm. O noble king and master, he cried, my poor companion has run away with. He will fall and break his neck.<|im_end|>", 0.4392834007740021, 1.140012264251709, "Bayard knew that his master was upon him, and he started off upon a rapid pace, and in a few moments was a good way off. Malagigi pretended to be in great alarm o, noble king and master. 
He cried, my poor companion is run away with he will fall and break his neck."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Fayard knew that his master was upon him, and he started off upon a rapid pace. And in a few moments, he had gone on maledijiji. Pretended to be in great alarm. O noble king and master, he cried, my poor companion has run away with me. He will fall and break his neck.<|im_end|>", 0.3476942181587219, -1.282332181930542, "Bayard knew that his master was upon him, and he started off upon a rapid pace, and in a few moments was a good way off. Malagigi pretended to be in great alarm o, noble king and master. He cried, my poor companion is run away with he will fall and break his neck."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>She laid a firm, delicate hand on her gold green jerkin. Elidor, this was pleasant, but we got no nearer. We can't sit here and learn the language. Terry protested.<|im_end|>", 0.9210602045059204, -1.0414021015167236, "She laid a firm, delicate hand on her gold green jerkin. Ellador, this was pleasant, but we got no nearer. We can't sit here and learn the language. Terry protested."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>She laid a firm, delicate hand on her gold green jerkin. Ellador. This was pleasant, but we got no nearer. We can't sit here and learn the language. Terry protested.<|im_end|>", 0.9217362999916077, 0.006559576839208603, "She laid a firm, delicate hand on her gold green jerkin. Ellador, this was pleasant, but we got no nearer. We can't sit here and learn the language. 
Terry protested."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>She laid a firm, delicate hand on her gold green jerkin. Ellador. This was pleasant, but we got no nearer. We can't sit here and learn the language. Terry protested.<|im_end|>", 0.9217362999916077, 0.006559576839208603, "She laid a firm, delicate hand on her gold green jerkin. Ellador, this was pleasant, but we got no nearer. We can't sit here and learn the language. Terry protested."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>She laid a firm, delicate hand on her gold green jerkin. Ellador this was pleasant, but we got no nearer. We can't sit here and learn the language. Terry protested.<|im_end|>", 0.9223955273628235, 1.0283753871917725, "She laid a firm, delicate hand on her gold green jerkin. Ellador, this was pleasant, but we got no nearer. We can't sit here and learn the language. 
Terry protested."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>he cried out sadly and fought and struggled two minutes however he did little against his four adversaries and worn out with his struggle clive suddenly went from dusty boy to motionless spirit lost lost he muttered all lost<|im_end|>", -0.10845243185758591, 0.03154230862855911, "he cried out savagely and fought with the strength of two men however he could do little against his four adversaries and worn out with the struggle collapsed suddenly on to the dusty floor with a motion of despair lost lost he muttered all lost"], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>he cried out sadly and fought and strived for two minutes however he did little against his four adversaries and worn out with his struggle, clapped suddenly on the dusty floor with a motionless spirit lost, lost he muttered all lost<|im_end|>", 0.1065172553062439, 1.328436017036438, "he cried out savagely and fought with the strength of two men however he could do little against his four adversaries and worn out with the struggle collapsed suddenly on to the dusty floor with a motion of despair lost lost he muttered all lost"], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>he cried out sadly and fought and struggled two minutes however he did little against four adversaries and worn out with his struggle clive suddenly went from dusty boy with emotion in his spirit lost, lost, he muttered, all lost<|im_end|>", -0.29121696949005127, -1.0710604190826416, "he cried out savagely and fought with the strength of two men however he could do little against his four adversaries and worn out with the struggle collapsed suddenly on to the dusty floor with a motion of despair lost lost he muttered all lost"], ["820", 
"<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>he cried out sadly and fought and struggled to win it however he did little against four adversaries and worn out with his struggle clive suddenly hung from the dusty floor with emotion in his spirit lost, lost he muttered all, lost<|im_end|>", -0.16157105565071106, -0.28891777992248535, "he cried out savagely and fought with the strength of two men however he could do little against his four adversaries and worn out with the struggle collapsed suddenly on to the dusty floor with a motion of despair lost lost he muttered all lost"], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And thus he accomplished this by the bye during the siege of the city, for he had his enemies in great contempt already. Nine when he had thus married mariamne.<|im_end|>", 0.6356512308120728, -1.4962533712387085, "And thus he accomplished this by the by, during the siege of the city. For he had his enemies in great contempt already nine when he had thus married mariamne, he."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And thus he accomplished this by the bye during the siege of the city, for he had his enemies in great contempt already nine when he had thus married mariamne.<|im_end|>", 0.715508222579956, 0.49875012040138245, "And thus he accomplished this by the by, during the siege of the city. 
For he had his enemies in great contempt already nine when he had thus married mariamne, he."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And thus he accomplished this by the bye during the siege of the city, for he had his enemies in great contempt already nine when he had thus married mariamne.<|im_end|>", 0.715508222579956, 0.49875012040138245, "And thus he accomplished this by the by, during the siege of the city. For he had his enemies in great contempt already nine when he had thus married mariamne, he."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>And thus he accomplished this by the bye during the siege of the city, for he had his enemies in great contempt already nine when he had thus married mariamne.<|im_end|>", 0.715508222579956, 0.49875012040138245, "And thus he accomplished this by the by, during the siege of the city. For he had his enemies in great contempt already nine when he had thus married mariamne, he."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Putting both hands on her shoulders and looking into the brown eyes, should you be willing to go abroad with your mother and phronsie mister king and jasper? Oh polly gasped. But you.<|im_end|>", 0.7878445386886597, -0.38495707511901855, "Putting both hands on her shoulders and looking into the brown eyes, should you be willing to go abroad with your mother and phronsie, mister king and jasper? Oh, polly gasped, but you."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Putting both hands on her shoulders and looking into the brown eyes, should you be willing to go abroad with your mother and phronsie? Mister king and jasper. 
Oh polly gasped but you.<|im_end|>", 0.7167295217514038, -1.1612764596939087, "Putting both hands on her shoulders and looking into the brown eyes, should you be willing to go abroad with your mother and phronsie, mister king and jasper? Oh, polly gasped, but you."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Putting both hands on her shoulders and looking into the brown eyes, should you be willing to go abroad with your mother and phronsie, mister king and jasper? Oh Polly gasped, but you.<|im_end|>", 0.9294845461845398, 1.1612406969070435, "Putting both hands on her shoulders and looking into the brown eyes, should you be willing to go abroad with your mother and phronsie, mister king and jasper? Oh, polly gasped, but you."], ["820", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Putting both hands on her shoulders and looking into the brown eyes, should you be willing to go abroad with your mother and phronsie mister king and jasper? Oh, polly gasped. But you.<|im_end|>", 0.858376145362854, 0.3849935233592987, "Putting both hands on her shoulders and looking into the brown eyes, should you be willing to go abroad with your mother and phronsie, mister king and jasper? Oh, polly gasped, but you."]]}
wandb/run-20260418_172847-c2a5hfz3/files/media/table/completions_43_9ca1008a424f8bb91c1c.table.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"columns": ["step", "prompt", "completion", "ASRWerSubLenCmpHalluDirtyV56", "advantages", "solution"], "data": [["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Hospitality to persuasion, dissuasion and evasion, a rebel.<|im_end|>", -0.0990181490778923, 0.05529142543673515, "Hospitable to persuasion, dissuasion and evasion. Rebel."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Hospitality to persuasion, dissuasion and evasion a rebel.<|im_end|>", -0.09743088483810425, 0.06276065856218338, "Hospitable to persuasion, dissuasion and evasion. Rebel."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Hospitality to persuasion, dissuasion and evasion, a rebel.<|im_end|>", -0.0990181490778923, 0.05529142543673515, "Hospitable to persuasion, dissuasion and evasion. Rebel."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Hospitality to persuasion, dissuasion and evasion of a rebel.<|im_end|>", -0.6668598651885986, -2.6168177127838135, "Hospitable to persuasion, dissuasion and evasion. Rebel."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Hospitality to persuasion, dissuasion and evasion a rebel.<|im_end|>", -0.09743088483810425, 0.06276065856218338, "Hospitable to persuasion, dissuasion and evasion. Rebel."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Hospitality to persuasion, dissuasion and evasion, a rebel.<|im_end|>", -0.0990181490778923, 0.05529142543673515, "Hospitable to persuasion, dissuasion and evasion. 
Rebel."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Hospitality to persuasion, dissuasion and evasion a rebel.<|im_end|>", -0.09743088483810425, 0.06276065856218338, "Hospitable to persuasion, dissuasion and evasion. Rebel."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Hospitality to persuasion, dissuasion and evasion, a rebel.<|im_end|>", -0.0990181490778923, 0.05529142543673515, "Hospitable to persuasion, dissuasion and evasion. Rebel."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Hospitable to persuasion, dissuasion and evasion, a rebel.<|im_end|>", 0.31988954544067383, 2.026557445526123, "Hospitable to persuasion, dissuasion and evasion. Rebel."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Hospitality to persuasion, dissuasion and evasion a rebel.<|im_end|>", -0.09743088483810425, 0.06276065856218338, "Hospitable to persuasion, dissuasion and evasion. Rebel."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Hospitality to persuasion, dissuasion and evasion, a rebel.<|im_end|>", -0.0990181490778923, 0.05529142543673515, "Hospitable to persuasion, dissuasion and evasion. Rebel."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Hospitality to persuasion, dissuasion and evasion a rebel.<|im_end|>", -0.09743088483810425, 0.06276065856218338, "Hospitable to persuasion, dissuasion and evasion. Rebel."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>But my sister must know you, she must until she need. 
Added richard pentecost.<|im_end|>", -0.9152219295501709, -1.1293256282806396, "Ah, but my sister must know you. She must, in case of need, have you to depend upon."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Ah, but my sister must know you she must until she need had reached a point of health.<|im_end|>", -0.8091338276863098, 0.08761630952358246, "Ah, but my sister must know you. She must, in case of need, have you to depend upon."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Ah, but my sister must know you she must until she need had reached a point of calm.<|im_end|>", -0.805532693862915, 0.12892509996891022, "Ah, but my sister must know you. She must, in case of need, have you to depend upon."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>But my sister must know you, she must until she need had reached a point of time.<|im_end|>", -0.9473012685775757, -1.4973094463348389, "Ah, but my sister must know you. She must, in case of need, have you to depend upon."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Ah, but my sister must know you, she must until he's met college de pontiac.<|im_end|>", -0.7323250770568848, 0.9686933755874634, "Ah, but my sister must know you. She must, in case of need, have you to depend upon."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Ah, but my sister must know you she must until he's met had reached a point of it.<|im_end|>", -0.8147860765457153, 0.022779079154133797, "Ah, but my sister must know you. 
She must, in case of need, have you to depend upon."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Ah, but my sister must know you she must until her death. I urged a point of time.<|im_end|>", -0.8164224624633789, 0.0040080128237605095, "Ah, but my sister must know you. She must, in case of need, have you to depend upon."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Ah, but my sister must know you she must until she need had reached a point of time.<|im_end|>", -0.8074418306350708, 0.10702529549598694, "Ah, but my sister must know you. She must, in case of need, have you to depend upon."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Ah, but my sister must know you she must until she need had reached a point of calm.<|im_end|>", -0.805532693862915, 0.12892509996891022, "Ah, but my sister must know you. She must, in case of need, have you to depend upon."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Ah, but my sister must know you. She must until she need have reached a point of that.<|im_end|>", -0.6205787658691406, 2.2505409717559814, "Ah, but my sister must know you. She must, in case of need, have you to depend upon."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>But my sister must know you, she must until tonight. Added, reached a pinnacle.<|im_end|>", -0.919543445110321, -1.1788979768753052, "Ah, but my sister must know you. 
She must, in case of need, have you to depend upon."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Ah, but my sister must know you she must until she need had reached a point of that.<|im_end|>", -0.8074418306350708, 0.10702529549598694, "Ah, but my sister must know you. She must, in case of need, have you to depend upon."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>My fellow, come along. He caught my arm and following our guide we hurried on through the darkness which was so dense that it did not bide to the wonderful eyesight of my black companion. A faculty which seemed to have been acquired.<|im_end|>", 0.5165535807609558, 1.6058197021484375, "black fellow come along he caught my arm and following our guide we hurried on through the darkness which was so dense that if it had not been for the wonderful eyesight of my black companion a faculty which seemed to have been acquired"], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>My fellow, come along. He caught my arm and following our guide we hurried on through the darkness which was so dense that it did not bid for the wonderful eyesight of my black companion. On the faculty which seemed to admit acquired.<|im_end|>", 0.34349849820137024, 0.2518061101436615, "black fellow come along he caught my arm and following our guide we hurried on through the darkness which was so dense that if it had not been for the wonderful eyesight of my black companion a faculty which seemed to have been acquired"], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>My fellow, come along. 
He cut my arm and following our guide we hurried on through the darkness which was so dense that it did not bid for the wonderful eyesight of my black companion. On the faculty which seemed to admit of acquired.<|im_end|>", 0.2730351984500885, -0.299511194229126, "black fellow come along he caught my arm and following our guide we hurried on through the darkness which was so dense that if it had not been for the wonderful eyesight of my black companion a faculty which seemed to have been acquired"], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>My fellow, come along. He caught my arm and following our guide we hurried on through the darkness which was so dense that it did not bide for the wonderful eyesight of my black companion. The faculty with speed to admit acquired.<|im_end|>", 0.2683812379837036, -0.33592459559440613, "black fellow come along he caught my arm and following our guide we hurried on through the darkness which was so dense that if it had not been for the wonderful eyesight of my black companion a faculty which seemed to have been acquired"], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>My fellow, come along. He caught my arm and following our guide we hurried on through the darkness which was so dense that it did not bide for the wonderful eyesight of my black companion. On the faculty with speed to admit the acquired.<|im_end|>", 0.20993445813655853, -0.7932225465774536, "black fellow come along he caught my arm and following our guide we hurried on through the darkness which was so dense that if it had not been for the wonderful eyesight of my black companion a faculty which seemed to have been acquired"], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>My fellow, come along. 
He caught my arm and following our guide we hurried on through the darkness which was so dense that it did not bid for the wonderful eyesight of my black companion. A faculty which seemed to have been acquired.<|im_end|>", 0.5796752572059631, 2.0996947288513184, "black fellow come along he caught my arm and following our guide we hurried on through the darkness which was so dense that if it had not been for the wonderful eyesight of my black companion a faculty which seemed to have been acquired"], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>My fellow, come along. He caught my arm and following our guide we hurried on through the darkness which was so dense that it did not bid for the wonderful eyesight of my black companion. On the faculty which seemed to admit of acquired.<|im_end|>", 0.3366594910621643, 0.19829651713371277, "black fellow come along he caught my arm and following our guide we hurried on through the darkness which was so dense that if it had not been for the wonderful eyesight of my black companion a faculty which seemed to have been acquired"], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>My fellow, come along. He caught my arm and following our guide we hurried on through the darkness which was so dense that it did not bid for the wonderful eyesight of my black companion. On the faculty which seemed to admit of acquired.<|im_end|>", 0.3366594910621643, 0.19829651713371277, "black fellow come along he caught my arm and following our guide we hurried on through the darkness which was so dense that if it had not been for the wonderful eyesight of my black companion a faculty which seemed to have been acquired"], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>My fellow, come along. 
He caught my arm and following our guide we hurried on through the darkness which was so dense that it did not bid for the wonderful eyesight of my black companion. I was faculty with speed to a myth of acquired.<|im_end|>", 0.15785956382751465, -1.2006657123565674, "black fellow come along he caught my arm and following our guide we hurried on through the darkness which was so dense that if it had not been for the wonderful eyesight of my black companion a faculty which seemed to have been acquired"], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>My fellow, come along. He cut my arm and following our guide we hurried on through the darkness which was so dense that it did not bid for the wonderful eyesight of my black companion. On the faculty which seemed to admit of acquired.<|im_end|>", 0.2730351984500885, -0.299511194229126, "black fellow come along he caught my arm and following our guide we hurried on through the darkness which was so dense that if it had not been for the wonderful eyesight of my black companion a faculty which seemed to have been acquired"], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>My fellow, come along. He caught my arm and following our guide we hurried on through the darkness which was so dense that it did not bid for the wonderful eyesight of my black companion. By the faculty which seemed to admit it, I inquired.<|im_end|>", 0.2825254499912262, -0.22525779902935028, "black fellow come along he caught my arm and following our guide we hurried on through the darkness which was so dense that if it had not been for the wonderful eyesight of my black companion a faculty which seemed to have been acquired"], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>My fellow, come along. 
He cut my arm and following our guide we hurried on through the darkness which was so dense that it did not bide for the wonderful eyesight of my black companion. On the faculty which speeded him inquired.<|im_end|>", 0.15796764194965363, -1.1998201608657837, "black fellow come along he caught my arm and following our guide we hurried on through the darkness which was so dense that if it had not been for the wonderful eyesight of my black companion a faculty which seemed to have been acquired"], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Scrapper's slightly raised cap seemed all black, but Peter turned up close enough and what he found couldn't eat was a patch of brown fur. While Peter sat staring up at him, Scrapper suddenly darted out into the air.<|im_end|>", 0.11510307341814041, 2.3401176929473877, "Scrapper's slightly raised cap seemed all black. But if peter could have gotten close enough, he would have found that hidden in it was a patch of orange red. While peter sat staring up at him, scrapper suddenly darted out into the air."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Scrapper's slightly raised cap seemed all black and quite quite ugly, so that he really found it good indeed was a patch of pure white while peter sat staring up at him scrapper suddenly darted out into the air.<|im_end|>", -0.09485074132680893, -1.0294468402862549, "Scrapper's slightly raised cap seemed all black. But if peter could have gotten close enough, he would have found that hidden in it was a patch of orange red. 
While peter sat staring up at him, scrapper suddenly darted out into the air."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Scrapper's slightly raised cap seemed, while black but dark and ugly close enough in a way that he couldn't eat was a patch of clear thread. While Peter sat staring up at him, Scrapper suddenly darted out into the air.<|im_end|>", -0.10472522675991058, -1.1879230737686157, "Scrapper's slightly raised cap seemed all black. But if peter could have gotten close enough, he would have found that hidden in it was a patch of orange red. While peter sat staring up at him, scrapper suddenly darted out into the air."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Scrapper's slightly raised cap seemed all black, but in a corner close enough to where he had found good meat was a patch of brown fur. While Peter sat staring up at him, Scrapper suddenly darted out into the air.<|im_end|>", 0.03434121981263161, 1.0439646244049072, "Scrapper's slightly raised cap seemed all black. But if peter could have gotten close enough, he would have found that hidden in it was a patch of orange red. While peter sat staring up at him, scrapper suddenly darted out into the air."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Scrapper's slightly raised cap seemed by black, but Peter couldn't get close enough and what he found couldn't eat was a patch of iron thread while peter sat staring up at him scrapper suddenly darted out into the air.<|im_end|>", -0.019613485783338547, 0.17804156243801117, "Scrapper's slightly raised cap seemed all black. But if peter could have gotten close enough, he would have found that hidden in it was a patch of orange red. 
While peter sat staring up at him, scrapper suddenly darted out into the air."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Scrapper's slightly raised cap seemed mob black like a peanut gum kerosene, and what he found couldn't eat was a patch of burned hair. While Peter sat staring up at him, Scrapper suddenly darted out into the air.<|im_end|>", -0.09868084639310837, -1.0909165143966675, "Scrapper's slightly raised cap seemed all black. But if peter could have gotten close enough, he would have found that hidden in it was a patch of orange red. While peter sat staring up at him, scrapper suddenly darted out into the air."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Scrapper's slightly raised cap seemed rather black, but Peter put it down cautiously and what he found couldn't eat was a patch of brown fur. While Peter sat staring up at him, Scrapper suddenly darted out into the air.<|im_end|>", -0.027708640322089195, 0.048121821135282516, "Scrapper's slightly raised cap seemed all black. But if peter could have gotten close enough, he would have found that hidden in it was a patch of orange red. While peter sat staring up at him, scrapper suddenly darted out into the air."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Scrapper's slightly raised cap seemed rather black, but Peter couldn't go closer than he really found it good and neat was a patch of fine fur while Peter sat staring up at him scrapper suddenly darted out into the air.<|im_end|>", -0.034929804503917694, -0.06777118146419525, "Scrapper's slightly raised cap seemed all black. But if peter could have gotten close enough, he would have found that hidden in it was a patch of orange red. 
While peter sat staring up at him, scrapper suddenly darted out into the air."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Scrapper's slightly raised cap seemed rather black, but peter put it down close enough that he really found it good and neat as a patch of pure thread. While peter sat staring up at him, scrapper suddenly darted out into the air.<|im_end|>", -0.0638682171702385, -0.5322059392929077, "Scrapper's slightly raised cap seemed all black. But if peter could have gotten close enough, he would have found that hidden in it was a patch of orange red. While peter sat staring up at him, scrapper suddenly darted out into the air."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Scrapper's slightly raised cap seemed rather black, but Peter couldn't get close enough to look down and could n't eat was a patch of pure white. While Peter sat staring up at him, Scrapper suddenly darted out into the air.<|im_end|>", -0.03125457838177681, -0.008787202648818493, "Scrapper's slightly raised cap seemed all black. But if peter could have gotten close enough, he would have found that hidden in it was a patch of orange red. While peter sat staring up at him, scrapper suddenly darted out into the air."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Scrapper's slightly raised cap seemed all black, but through it came a glimpse of that he had really found good and eat was a patch of brown fur. While Peter sat staring up at him, Scrapper suddenly darted out into the air.<|im_end|>", 0.005603947211056948, 0.5827580094337463, "Scrapper's slightly raised cap seemed all black. But if peter could have gotten close enough, he would have found that hidden in it was a patch of orange red. 
While peter sat staring up at him, scrapper suddenly darted out into the air."], ["85", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Scrapper's slightly raised cap seemed odd black, but Peter couldn't have told you that he really found it good and neat as a patch of fine thread while Peter sat staring up at him Scrapper suddenly darted out into the air.<|im_end|>", -0.04790138080716133, -0.2759529650211334, "Scrapper's slightly raised cap seemed all black. But if peter could have gotten close enough, he would have found that hidden in it was a patch of orange red. While peter sat staring up at him, scrapper suddenly darted out into the air."]]}
wandb/run-20260418_172847-c2a5hfz3/files/media/table/completions_63_9c15897616f0ff0b68b9.table.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"columns": ["step", "prompt", "completion", "ASRWerSubLenCmpHalluDirtyV56", "advantages", "solution"], "data": [["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Or go on forever without swerving to the right or to the left that is what it means to escape this paralysis you should ask how does a straight line feel it feels as I suppose it must straight<|im_end|>", 0.8176915645599365, -0.15929217636585236, "or go on forever without swerving to the right or to the left that is what it means to escape this moralizing you should ask how does the straight line feel it feels as i suppose it looks straight"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Or go on forever without swerving to the right or to the left that is what it means to escape this paralysis you should ask how does a straight line feel it feels as I suppose it must straight<|im_end|>", 0.8176915645599365, -0.15929217636585236, "or go on forever without swerving to the right or to the left that is what it means to escape this moralizing you should ask how does the straight line feel it feels as i suppose it looks straight"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Or go on forever without swerving to the right or to the left that is what it means to escape this paralysis you should ask how does the straight line feel it feels as I suppose it must straight<|im_end|>", 0.8759769797325134, 0.7718859910964966, "or go on forever without swerving to the right or to the left that is what it means to escape this moralizing you should ask how does the straight line feel it feels as i suppose it looks straight"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Or go on forever without swerving to the 
right or to the left that is what it means to escape this paralysis you should ask how does the straight line feel it feels as I suppose it must straight<|im_end|>", 0.8759769797325134, 0.7718859910964966, "or go on forever without swerving to the right or to the left that is what it means to escape this moralizing you should ask how does the straight line feel it feels as i suppose it looks straight"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Or go on forever without swerving to the right or to the left that is what it means to escape this paralysis you should ask how does the straight line feel it feels as I suppose it must straight<|im_end|>", 0.8759769797325134, 0.7718859910964966, "or go on forever without swerving to the right or to the left that is what it means to escape this moralizing you should ask how does the straight line feel it feels as i suppose it looks straight"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Or go on forever without stopping to the right or to the left that is what it means to escape this paralysis you should ask how does the straight line feel it feels as I suppose it must straight<|im_end|>", 0.8153555989265442, -0.19661197066307068, "or go on forever without swerving to the right or to the left that is what it means to escape this moralizing you should ask how does the straight line feel it feels as i suppose it looks straight"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Or go on forever without stopping to the right or to the left that is what it means to escape this paralysis you should ask how does the straight line feel it feels as I suppose it must straight<|im_end|>", 0.8153555989265442, -0.19661197066307068, "or go on forever without swerving to the right or to the left that is 
what it means to escape this moralizing you should ask how does the straight line feel it feels as i suppose it looks straight"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Or go on forever without stopping to the right or to the left that is what it means to escape the spiral axis you should ask how does a straight line feel it feels as I suppose it must straight<|im_end|>", 0.6529189348220825, -2.791729211807251, "or go on forever without swerving to the right or to the left that is what it means to escape this moralizing you should ask how does the straight line feel it feels as i suppose it looks straight"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Or go on forever without swerving to the right or to the left that is what it means to escape this paralysis you should ask how does the straight line feel it feels as I suppose it must straight<|im_end|>", 0.8759769797325134, 0.7718859910964966, "or go on forever without swerving to the right or to the left that is what it means to escape this moralizing you should ask how does the straight line feel it feels as i suppose it looks straight"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Or go on forever without swerving to the right or to the left that is what it means to escape this paralysis you should ask how does the straight line feel it feels as I suppose it must straight<|im_end|>", 0.8759769797325134, 0.7718859910964966, "or go on forever without swerving to the right or to the left that is what it means to escape this moralizing you should ask how does the straight line feel it feels as i suppose it looks straight"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Or go on forever without 
swerving to the right or to the left that is what it means to escape this paralysis you should ask how does a straight line feel it feels as I suppose it must straight<|im_end|>", 0.8176915645599365, -0.15929217636585236, "or go on forever without swerving to the right or to the left that is what it means to escape this moralizing you should ask how does the straight line feel it feels as i suppose it looks straight"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Or go on forever without stopping to the right or to the left that is what it means to escape this paralysis you should ask how does the straight line feel it feels as I suppose it must straight<|im_end|>", 0.8153555989265442, -0.19661197066307068, "or go on forever without swerving to the right or to the left that is what it means to escape this moralizing you should ask how does the straight line feel it feels as i suppose it looks straight"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They twist his foot and beat him again, in another place. He that flattereth his neighbour spreadeth a net for mischief. So I will try to keep away from that lady, shall I not papa? Whenever you can do so without ruin this daughter.<|im_end|>", 0.04660210758447647, -0.13953234255313873, "Favor is deceitful, and beauty is vain. And in another place, he that flattereth his neighbor spreadeth a net for his feet. So I will try to keep away from that lady, shall I not? Papa, whenever you can do so without rudeness. Daughter."], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They twist his neck and make him sing in another place, he that flattereth his neighbour spreadeth a net for his feet. So I will try to keep away from that lady, shall I not papa? 
Whenever you can do so without rudeness, daughter.<|im_end|>", 0.2873304486274719, 1.2487980127334595, "Favor is deceitful, and beauty is vain. And in another place, he that flattereth his neighbor spreadeth a net for his feet. So I will try to keep away from that lady, shall I not? Papa, whenever you can do so without rudeness. Daughter."], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They twist and twist, and do as they will, in another place. He that flattereth his neighbour spreadeth a net for his gain. So I will try to keep away from that lady. Shall I not papa? Whenever you can do so without ruin, my daughter.<|im_end|>", 0.04480805993080139, -0.14987899363040924, "Favor is deceitful, and beauty is vain. And in another place, he that flattereth his neighbor spreadeth a net for his feet. So I will try to keep away from that lady, shall I not? Papa, whenever you can do so without rudeness. Daughter."], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They twist and fold, and bend and sin in some other place he that flattereth his neighbour spreadeth a net for him so I will try to keep away from that lately shall I not papa whenever you can do so without rudeness daughter<|im_end|>", -0.06204881891608238, -0.7661447525024414, "Favor is deceitful, and beauty is vain. And in another place, he that flattereth his neighbor spreadeth a net for his feet. So I will try to keep away from that lady, shall I not? Papa, whenever you can do so without rudeness. Daughter."], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>save rooster's nest and bird's ass in another place, he that flattereth his neighbour spreadeth a net for himself. So I will try to keep away from that lady, shall I not papa? 
Whenever you can do so without rudeness, daughter.<|im_end|>", 0.25164204835891724, 1.0429755449295044, "Favor is deceitful, and beauty is vain. And in another place, he that flattereth his neighbor spreadeth a net for his feet. So I will try to keep away from that lady, shall I not? Papa, whenever you can do so without rudeness. Daughter."], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They will see you there, and be as angry in another place. He that flattereth his neighbour spreadeth him nighfully. So I will try to keep away from that lady, shall I not papa? Whenever you can do so without rudeness, daughter.<|im_end|>", -0.12804561853408813, -1.1467620134353638, "Favor is deceitful, and beauty is vain. And in another place, he that flattereth his neighbor spreadeth a net for his feet. So I will try to keep away from that lady, shall I not? Papa, whenever you can do so without rudeness. Daughter."], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>save his sister's life and do as i say in another place, he that flattereth his neighbour spreadeth a net for him so I will try to keep away from that lady shall I not papa? Whenever you can do so without ruining this daughter.<|im_end|>", 0.05892462283372879, -0.06846584379673004, "Favor is deceitful, and beauty is vain. And in another place, he that flattereth his neighbor spreadeth a net for his feet. So I will try to keep away from that lady, shall I not? Papa, whenever you can do so without rudeness. Daughter."], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They twist and wriggle, and do as they can. And in another place he that flattereth his neighbour spreadeth a net for him. So I will try to keep away from that lady, shall I not papa? 
Whenever you can do so without rudeness, daughter.<|im_end|>", 0.12734483182430267, 0.32612770795822144, "Favor is deceitful, and beauty is vain. And in another place, he that flattereth his neighbor spreadeth a net for his feet. So I will try to keep away from that lady, shall I not? Papa, whenever you can do so without rudeness. Daughter."], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They twist and twirl, and turn and spin. And in another place, he that flattereth his neighbour spreadeth a net for his gain. So I will try to keep away from that way. Shall I not papa? Whenever you can do so without rudeness, daughter.<|im_end|>", 0.2292451709508896, 0.9138080477714539, "Favor is deceitful, and beauty is vain. And in another place, he that flattereth his neighbor spreadeth a net for his feet. So I will try to keep away from that lady, shall I not? Papa, whenever you can do so without rudeness. Daughter."], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They please to see me and do as I say in another place he that flattereth his neighbour spreadeth him nectarously so I will try to keep away from that lady shall I not papa whenever you can do so without ruining us daughter<|im_end|>", -0.3151572346687317, -2.2258734703063965, "Favor is deceitful, and beauty is vain. And in another place, he that flattereth his neighbor spreadeth a net for his feet. So I will try to keep away from that lady, shall I not? Papa, whenever you can do so without rudeness. Daughter."], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>save his sister and do as he does in another place, he that flattereth his neighbour spreadeth a net for himself. So I will try to keep away from that lady, shall I not papa? 
Whenever you can do so without robbing his daughter.<|im_end|>", 0.1756473332643509, 0.6046982407569885, "Favor is deceitful, and beauty is vain. And in another place, he that flattereth his neighbor spreadeth a net for his feet. So I will try to keep away from that lady, shall I not? Papa, whenever you can do so without rudeness. Daughter."], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>They will, said he and do as they please. And in another place, he that flattereth his neighbour spreadeth a net for him. So I will try to keep away from that lady, shall I not papa? Whenever you can do so without robbing this daughter.<|im_end|>", 0.13326135277748108, 0.36024948954582214, "Favor is deceitful, and beauty is vain. And in another place, he that flattereth his neighbor spreadeth a net for his feet. So I will try to keep away from that lady, shall I not? Papa, whenever you can do so without rudeness. Daughter."], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I was so anxious to hear a little about him to know what I could keep away that's another thing and shows me that if I didn't teach my boys anything else I did give them brotherly love that when they say how good we were in our services to all who came<|im_end|>", -0.27307480573654175, -0.7399817705154419, "i was so anxious to hear all about the dear old boy i couldn't keep away that's right comfortable and shows me that if i didn't teach my boys anything else i did give them the brotherly love that will make them stand by one another all their lives said missus jo when he had gone"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I was so anxious to hear a little about you to know what I could keep away that's enough and shows me that if I didn't teach my boys anything else, I did 
give them brotherly love, but with a samurai or battle of war civilities too formal<|im_end|>", -0.43343213200569153, -2.054769992828369, "i was so anxious to hear all about the dear old boy i couldn't keep away that's right comfortable and shows me that if i didn't teach my boys anything else i did give them the brotherly love that will make them stand by one another all their lives said missus jo when he had gone"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I was so anxious to hear about her, to know what I could keep away that's enough of it and shows me that if I didn't teach my boys anything else I did give them brotherly love that made their sad and lonely hours seem a little more palatable<|im_end|>", -0.2620263695716858, -0.6493943333625793, "i was so anxious to hear all about the dear old boy i couldn't keep away that's right comfortable and shows me that if i didn't teach my boys anything else i did give them the brotherly love that will make them stand by one another all their lives said missus jo when he had gone"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I was so anxious to hear a little about him, to know what I could keep away that's another thing and shows me that if I didn't teach my boys anything else I did give them brotherly love that when they say nothing of their own or some one is stupid or weak.<|im_end|>", -0.21280650794506073, -0.24583503603935242, "i was so anxious to hear all about the dear old boy i couldn't keep away that's right comfortable and shows me that if i didn't teach my boys anything else i did give them the brotherly love that will make them stand by one another all their lives said missus jo when he had gone"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I was so anxious to hear 
about you, dear boy, I couldn't keep away. That's another thing and shows me that if I didn't teach my boys anything else, I did give them a brotherly love that made their sad hour of trouble worse than the sickness itself.<|im_end|>", -0.23551680147647858, -0.432039350271225, "i was so anxious to hear all about the dear old boy i couldn't keep away that's right comfortable and shows me that if i didn't teach my boys anything else i did give them the brotherly love that will make them stand by one another all their lives said missus jo when he had gone"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I was so anxious to hear a little about him to know what I could keep away that's enough of it and shows me that if I didn't teach my boys anything else I did give them brotherly love that will render Sam happy or make their mothers' sinlessness superfluous<|im_end|>", -0.18895041942596436, -0.05023622140288353, "i was so anxious to hear all about the dear old boy i couldn't keep away that's right comfortable and shows me that if i didn't teach my boys anything else i did give them the brotherly love that will make them stand by one another all their lives said missus jo when he had gone"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I was so anxious to hear a little about her to a boy I couldn't keep away that's enough and shows me that if I didn't teach my boys anything else I did give them brotherly love that will in a sad hour bring back their own personal sympathies to my heart<|im_end|>", -0.0468180887401104, 1.1151231527328491, "i was so anxious to hear all about the dear old boy i couldn't keep away that's right comfortable and shows me that if i didn't teach my boys anything else i did give them the brotherly love that will make them stand by one another all their lives said missus jo when he had gone"], 
["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I was so anxious to hear a mother talk to her boy I couldn't keep away that's another proof it shows me that if I didn't teach my boys anything else I did give them brotherly love that will in a sad hour comfort and divert their sicknesses to the morning<|im_end|>", -0.1063055768609047, 0.6273783445358276, "i was so anxious to hear all about the dear old boy i couldn't keep away that's right comfortable and shows me that if i didn't teach my boys anything else i did give them the brotherly love that will make them stand by one another all their lives said missus jo when he had gone"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I was so anxious to hear all about you, dear old boy, I couldn't keep away that's another proof and shows me that if I didn't teach my boys anything else, I did give them brotherly love that led to the same kind of good and bad comparisons as this stupid boy.<|im_end|>", -0.060284294188022614, 1.0047121047973633, "i was so anxious to hear all about the dear old boy i couldn't keep away that's right comfortable and shows me that if i didn't teach my boys anything else i did give them the brotherly love that will make them stand by one another all their lives said missus jo when he had gone"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I was so anxious to hear all about you to a boy I couldn't keep away that's another proof and shows me that if I didn't teach my boys anything else I did give them brotherly love that when they say I'm a good boy I mean I've been a son of sin since school days<|im_end|>", -0.13280440866947174, 0.4101113975048065, "i was so anxious to hear all about the dear old boy i couldn't keep away that's right comfortable and shows me that if i 
didn't teach my boys anything else i did give them the brotherly love that will make them stand by one another all their lives said missus jo when he had gone"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I was so anxious to hear a lullaby to a boy I could keep away that's enough of him and shows me that if I didn't teach my boys anything else I did give them brotherly love that made their sad hour more bearable than our sinlessness to you all<|im_end|>", -0.2491731345653534, -0.5440092086791992, "i was so anxious to hear all about the dear old boy i couldn't keep away that's right comfortable and shows me that if i didn't teach my boys anything else i did give them the brotherly love that will make them stand by one another all their lives said missus jo when he had gone"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>I was so anxious to hear all about it to a boy I couldn't keep away that's enough of him and shows me that if I didn't teach my boys anything else I did give them brotherly love that will in the same way overcome their own worst tendencies too far<|im_end|>", 0.00731202308088541, 1.558942198753357, "i was so anxious to hear all about the dear old boy i couldn't keep away that's right comfortable and shows me that if i didn't teach my boys anything else i did give them the brotherly love that will make them stand by one another all their lives said missus jo when he had gone"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Increased materially and therefore also with powers of resistance may easily be conceived with vast quantities of elastic gases what mass of molten matter accumulated beneath its solid surface lost no exit as practicable after the cooling of the trachy crust<|im_end|>", 0.6219021677970886, 
0.48375576734542847, "increased materially and therefore also its powers of resistance it may easily be conceived what vast quantities of elastic gases what masses of molten matter accumulated beneath its solid surface whilst no exit was practicable after the cooling of the trachytic crust"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Increased materially and therefore also in the powers of resistance may easily be conceived with vast quantities of elastic gases what mass of molten matter accumulated beneath its solid surface whilst no exit is practicable after the cooling of the tribut crust<|im_end|>", 0.6310301423072815, 0.5756562948226929, "increased materially and therefore also its powers of resistance it may easily be conceived what vast quantities of elastic gases what masses of molten matter accumulated beneath its solid surface whilst no exit was practicable after the cooling of the trachytic crust"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Increased materially and therefore also in the power of resistance may easily be conceived with vast quantities of elastic gases what mass of molten matter accumulated beneath its solid surface whilst no exit is practicable after the cooling of the trading crust<|im_end|>", 0.5663049817085266, -0.07599729299545288, "increased materially and therefore also its powers of resistance it may easily be conceived what vast quantities of elastic gases what masses of molten matter accumulated beneath its solid surface whilst no exit was practicable after the cooling of the trachytic crust"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Increased materially and therefore also in powers of resistance, it may easily be conceived that vast quantities of elastic gases, what mass of molten 
matter accumulated beneath its solid surface, whilst no exit is practicable after the cooling of the trivet crust.<|im_end|>", 0.4862109422683716, -0.8823849558830261, "increased materially and therefore also its powers of resistance it may easily be conceived what vast quantities of elastic gases what masses of molten matter accumulated beneath its solid surface whilst no exit was practicable after the cooling of the trachytic crust"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Increase materially and therefore also the power of resistance it may easily be conceived with vast quantities of elastic gases what mass of molten matter accumulated beneath its solid surface whilst no exit is practicable after the cooling of the trivet crust<|im_end|>", 0.6143525242805481, 0.407745897769928, "increased materially and therefore also its powers of resistance it may easily be conceived what vast quantities of elastic gases what masses of molten matter accumulated beneath its solid surface whilst no exit was practicable after the cooling of the trachytic crust"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Increased materially, and therefore also with powers of resistance may easily be conceived a vast quantities of elastic gases what mass of molten matter accumulated beneath its solid surface whilst no exit is practicable after the cooling of the trigate crust<|im_end|>", 0.6209789514541626, 0.47446081042289734, "increased materially and therefore also its powers of resistance it may easily be conceived what vast quantities of elastic gases what masses of molten matter accumulated beneath its solid surface whilst no exit was practicable after the cooling of the trachytic crust"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Increase 
materially and therefore also in the power of resistance may easily be conceived with vast quantities of elastic gases what mass of impalpable matter accumulated beneath its solid surface whilst no exit is practicable after the cooling of the trading crust<|im_end|>", 0.43219640851020813, -1.4262038469314575, "increased materially and therefore also its powers of resistance it may easily be conceived what vast quantities of elastic gases what masses of molten matter accumulated beneath its solid surface whilst no exit was practicable after the cooling of the trachytic crust"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Increased materially and therefore also in powers of resistance may easily be conceived with vast quantities of elastic gases what mass of molten matter accumulated beneath its solid surface whilst no exit is practicable after the cooling of the tributary crust<|im_end|>", 0.6819920539855957, 1.088741421699524, "increased materially and therefore also its powers of resistance it may easily be conceived what vast quantities of elastic gases what masses of molten matter accumulated beneath its solid surface whilst no exit was practicable after the cooling of the trachytic crust"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Increased materially, and therefore also with powers of resistance may easily be conceived. With vast quantities of elastic gases, what mass of molten matter accumulated beneath its solid surface? 
Whilst no exit is practicable after the cooling of the trinity crust.<|im_end|>", 0.3609590530395508, -2.1434223651885986, "increased materially and therefore also its powers of resistance it may easily be conceived what vast quantities of elastic gases what masses of molten matter accumulated beneath its solid surface whilst no exit was practicable after the cooling of the trachytic crust"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Increase materially and therefore also in powers of resistance may easily be conceived with vast quantities of elastic gases what mass of molten matter accumulated beneath its solid surface whilst no exit is practicable after the cooling of the trading crust<|im_end|>", 0.6215246319770813, 0.4799547493457794, "increased materially and therefore also its powers of resistance it may easily be conceived what vast quantities of elastic gases what masses of molten matter accumulated beneath its solid surface whilst no exit was practicable after the cooling of the trachytic crust"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Increased materially and therefore also with powers of resistance may easily be conceived a vast quantities of elastic gases what mass of molten matter accumulated beneath its solid surface whilst no exit is practicable after the cooling of the tribut crust<|im_end|>", 0.6820893883705139, 1.0897213220596313, "increased materially and therefore also its powers of resistance it may easily be conceived what vast quantities of elastic gases what masses of molten matter accumulated beneath its solid surface whilst no exit was practicable after the cooling of the trachytic crust"], ["125", "<|im_start|>system\n<|im_end|>\n<|im_start|>user\n<|im_end|>\n<|im_start|>assistant\n", "language English<asr_text>Increase materially and therefore also the powers of resistance 
may easily be conceived with vast quantities of elastic gases what mass of molten matter accumulated beneath its solid surface whilst no exit is practicable after the cooling of the trade at crust<|im_end|>", 0.5666987299919128, -0.07203302532434464, "increased materially and therefore also its powers of resistance it may easily be conceived what vast quantities of elastic gases what masses of molten matter accumulated beneath its solid surface whilst no exit was practicable after the cooling of the trachytic crust"]]}
wandb/run-20260418_172847-c2a5hfz3/files/output.log ADDED
The diff for this file is too large to render. See raw diff
 
wandb/run-20260418_172847-c2a5hfz3/files/requirements.txt ADDED
@@ -0,0 +1,255 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ psutil==7.2.2
2
+ colorama==0.4.6
3
+ typing-inspection==0.4.2
4
+ dill==0.3.8
5
+ aliyun-python-sdk-kms==2.16.5
6
+ urllib3==2.6.3
7
+ torch==2.6.0
8
+ threadpoolctl==3.6.0
9
+ pyzmq==27.1.0
10
+ astor==0.8.1
11
+ hf-xet==1.4.3
12
+ sniffio==1.3.1
13
+ tensorboard==2.20.0
14
+ fastar==0.11.0
15
+ llvmlite==0.43.0
16
+ pathspec==1.0.4
17
+ mkl_fft==1.3.11
18
+ prometheus_client==0.25.0
19
+ async-timeout==5.0.1
20
+ scikit-learn==1.7.2
21
+ sortedcontainers==2.4.0
22
+ Bottleneck==1.4.2
23
+ orjson==3.11.8
24
+ nest-asyncio==1.6.0
25
+ cupy-cuda12x==13.6.0
26
+ semantic-version==2.10.0
27
+ aiosignal==1.4.0
28
+ fsspec==2025.3.0
29
+ dyNET38==2.2
30
+ shellingham==1.5.4
31
+ zstandard==0.25.0
32
+ PyYAML==6.0.3
33
+ nvidia-curand-cu12==10.3.5.147
34
+ gradio==5.50.0
35
+ Werkzeug==3.1.8
36
+ grpcio==1.80.0
37
+ aiohttp==3.13.5
38
+ Flask==3.1.3
39
+ python-json-logger==4.1.0
40
+ trl==0.29.1
41
+ nltk==3.9.4
42
+ platformdirs==4.9.6
43
+ lm-format-enforcer==0.10.12
44
+ pyparsing==3.3.2
45
+ jmespath==0.10.0
46
+ starlette==0.52.1
47
+ crcmod==1.7
48
+ dnspython==2.8.0
49
+ antlr4-python3-runtime==4.9.3
50
+ rouge==1.0.1
51
+ importlib_metadata==9.0.0
52
+ nvidia-cudnn-cu12==9.1.0.70
53
+ safetensors==0.7.0
54
+ blake3==1.0.8
55
+ interegular==0.3.3
56
+ tiktoken==0.11.0
57
+ pydantic_core==2.41.4
58
+ outlines==0.1.11
59
+ airportsdata==20260315
60
+ rich-toolkit==0.19.7
61
+ multiprocess==0.70.16
62
+ sympy==1.13.1
63
+ psutil==7.2.2
64
+ h11==0.16.0
65
+ anyio==4.13.0
66
+ Cython==3.2.4
67
+ outlines_core==0.1.26
68
+ jsonschema==4.26.0
69
+ nvidia-cuda-cupti-cu12==12.4.127
70
+ meson-python==0.19.0
71
+ depyf==0.18.0
72
+ audioread==3.1.0
73
+ typer==0.24.1
74
+ nvidia-cuda-nvrtc-cu12==12.4.127
75
+ joblib==1.5.3
76
+ torchvision==0.21.0
77
+ hf-gradio==0.3.2
78
+ huggingface_hub==0.36.2
79
+ websockets==15.0.1
80
+ diskcache==5.6.3
81
+ mistral_common==1.11.0
82
+ partial-json-parser==0.2.1.1.post7
83
+ simplejson==3.20.2
84
+ watchfiles==1.1.1
85
+ Jinja2==3.1.6
86
+ GitPython==3.1.46
87
+ numexpr==2.11.0
88
+ pydub==0.25.1
89
+ brotli==1.2.0
90
+ binpacking==2.0.1
91
+ cmake==4.3.1
92
+ pydantic==2.12.3
93
+ mkl-service==2.4.0
94
+ protobuf==6.33.6
95
+ gguf==0.10.0
96
+ MarkupSafe==3.0.3
97
+ exceptiongroup==1.3.1
98
+ markdown-it-py==4.0.0
99
+ soxr==1.0.0
100
+ pyarrow==20.0.0
101
+ tqdm==4.67.3
102
+ meson==1.11.0
103
+ fonttools==4.62.1
104
+ annotated-types==0.7.0
105
+ networkx==3.4.2
106
+ nvidia-cuda-runtime-cu12==12.4.127
107
+ compressed-tensors==0.9.2
108
+ wandb==0.23.0
109
+ mdurl==0.1.2
110
+ charset-normalizer==3.4.7
111
+ Pygments==2.20.0
112
+ zipp==3.23.1
113
+ prometheus-fastapi-instrumentator==7.1.0
114
+ aiofiles==24.1.0
115
+ lark==1.2.2
116
+ addict==2.4.0
117
+ pydantic-settings==2.13.1
118
+ opencv-python-headless==4.11.0.86
119
+ certifi==2026.2.25
120
+ sox==1.5.0
121
+ nagisa==0.2.11
122
+ six==1.17.0
123
+ tokenizers==0.22.2
124
+ mkl_random==1.2.8
125
+ fastapi-cloud-cli==0.17.0
126
+ propcache==0.4.1
127
+ cachetools==7.0.5
128
+ rpds-py==0.30.0
129
+ torchaudio==2.6.0
130
+ setuptools==82.0.1
131
+ py-cpuinfo==9.0.0
132
+ tomli==2.4.1
133
+ xxhash==3.6.0
134
+ pip==26.0.1
135
+ contourpy==1.3.2
136
+ absl-py==2.4.0
137
+ mpmath==1.3.0
138
+ ms_swift==4.0.3
139
+ pyproject-metadata==0.11.0
140
+ aiohappyeyeballs==2.6.1
141
+ httpx==0.28.1
142
+ json_repair==0.59.4
143
+ blinker==1.9.0
144
+ tzdata==2025.3
145
+ tensorboard-data-server==0.7.2
146
+ pydantic-extra-types==2.11.1
147
+ Markdown==3.10.2
148
+ nvidia-cusparselt-cu12==0.6.2
149
+ rignore==0.7.6
150
+ openai==2.32.0
151
+ soundfile==0.13.1
152
+ lazy-loader==0.5
153
+ av==14.2.0
154
+ yarl==1.23.0
155
+ python-dateutil==2.9.0.post0
156
+ groovy==0.1.2
157
+ xformers==0.0.29.post2
158
+ qwen-omni-utils==0.0.9
159
+ rich==15.0.0
160
+ xgrammar==0.1.16
161
+ numba==0.60.0
162
+ nvidia-cusolver-cu12==11.6.1.9
163
+ scikit_build_core==0.12.2
164
+ ffmpy==1.0.0
165
+ wheel==0.46.3
166
+ jiter==0.14.0
167
+ oss2==2.19.1
168
+ transformers==4.57.6
169
+ fastrlock==0.8.3
170
+ click==8.3.2
171
+ pooch==1.9.0
172
+ distro==1.9.0
173
+ nvidia-cublas-cu12==12.4.5.8
174
+ regex==2026.4.4
175
+ cpm-kernels==1.0.11
176
+ safehttpx==0.1.7
177
+ matplotlib==3.10.8
178
+ httptools==0.7.1
179
+ nvidia-cusparse-cu12==12.3.1.170
180
+ qwen-asr==0.0.6
181
+ gradio_client==1.14.0
182
+ gitdb==4.0.12
183
+ fastapi-cli==0.0.24
184
+ soynlp==0.0.493
185
+ python-dotenv==1.2.2
186
+ nvidia-cufft-cu12==11.2.1.3
187
+ accelerate==1.12.0
188
+ tomlkit==0.13.3
189
+ triton==3.2.0
190
+ filelock==3.28.0
191
+ pycountry==26.2.16
192
+ modelscope==1.35.4
193
+ annotated-doc==0.0.4
194
+ referencing==0.37.0
195
+ numpy==1.26.4
196
+ aliyun-python-sdk-core==2.16.0
197
+ attrs==26.1.0
198
+ vllm==0.8.0
199
+ python-multipart==0.0.26
200
+ jsonschema-specifications==2025.9.1
201
+ idna==3.11
202
+ scipy==1.15.3
203
+ typing_extensions==4.15.0
204
+ itsdangerous==2.2.0
205
+ msgspec==0.21.1
206
+ msgpack==1.1.2
207
+ nvidia-nvjitlink-cu12==12.4.127
208
+ pycryptodome==3.23.0
209
+ ninja==1.13.0
210
+ pillow==11.3.0
211
+ email-validator==2.3.0
212
+ cryptography==46.0.7
213
+ peft==0.18.1
214
+ kiwisolver==1.5.0
215
+ cffi==2.0.0
216
+ einops==0.8.2
217
+ pytz==2026.1.post1
218
+ uvloop==0.22.1
219
+ requests==2.33.1
220
+ sentencepiece==0.2.1
221
+ attrdict==2.0.1
222
+ dacite==1.9.2
223
+ cloudpickle==3.1.2
224
+ ray==2.55.0
225
+ fastapi==0.135.3
226
+ librosa==0.11.0
227
+ ruff==0.15.10
228
+ multidict==6.7.1
229
+ smmap==5.0.3
230
+ packaging==26.0
231
+ pycparser==3.0
232
+ decorator==5.2.1
233
+ transformers-stream-generator==0.0.5
234
+ nvidia-nccl-cu12==2.21.5
235
+ frozenlist==1.8.0
236
+ uvicorn==0.44.0
237
+ datasets==3.6.0
238
+ cycler==0.12.1
239
+ omegaconf==2.3.0
240
+ httpcore==1.0.9
241
+ pandas==2.3.2
242
+ nvidia-nvtx-cu12==12.4.127
243
+ sentry-sdk==2.58.0
244
+ wheel==0.46.3
245
+ autocommand==2.2.2
246
+ tomli==2.4.0
247
+ packaging==26.0
248
+ more-itertools==10.8.0
249
+ zipp==3.23.0
250
+ platformdirs==4.4.0
251
+ jaraco.context==6.1.0
252
+ jaraco.text==4.0.0
253
+ backports.tarfile==1.2.0
254
+ jaraco.functools==4.4.0
255
+ importlib_metadata==8.7.1
wandb/run-20260418_172847-c2a5hfz3/files/wandb-metadata.json ADDED
@@ -0,0 +1,213 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "os": "Linux-3.10.0-957.el7.x86_64-x86_64-with-glibc2.17",
3
+ "python": "CPython 3.10.18",
4
+ "startedAt": "2026-04-18T09:28:47.432340Z",
5
+ "args": [
6
+ "--rlhf_type",
7
+ "grpo",
8
+ "--external_plugins",
9
+ "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/my_qwen3_asr_dapo_register.py",
10
+ "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/0417_reward.py",
11
+ "--model",
12
+ "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/qwen3-asr-merged",
13
+ "--model_type",
14
+ "my_qwen3_asr_rl",
15
+ "--template",
16
+ "my_qwen3_asr_rl",
17
+ "--dataset",
18
+ "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/lora_0323_10w+55w+error+syn_with_domain_train90_targeted_rl_train90_loramerged_basewer_3suppress_server.jsonl",
19
+ "--val_dataset",
20
+ "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/lora_0323_10w+55w+error+syn_with_domain_train90_targeted_rl_val5_sample5p_server.jsonl",
21
+ "--reward_funcs",
22
+ "asr_wer_sub_len_cmp_hallu_dirty_v56",
23
+ "--train_type",
24
+ "lora",
25
+ "--use_vllm",
26
+ "false",
27
+ "--log_completions",
28
+ "true",
29
+ "--loss_type",
30
+ "dapo",
31
+ "--advantage_estimator",
32
+ "grpo",
33
+ "--scale_rewards",
34
+ "group",
35
+ "--num_iterations",
36
+ "2",
37
+ "--beta",
38
+ "0.04",
39
+ "--epsilon_high",
40
+ "0.28",
41
+ "--dynamic_sample",
42
+ "true",
43
+ "--max_resample_times",
44
+ "4",
45
+ "--overlong_filter",
46
+ "true",
47
+ "--truncation_strategy",
48
+ "delete",
49
+ "--num_generations",
50
+ "12",
51
+ "--generation_batch_size",
52
+ "48",
53
+ "--per_device_train_batch_size",
54
+ "4",
55
+ "--per_device_eval_batch_size",
56
+ "4",
57
+ "--gradient_accumulation_steps",
58
+ "12",
59
+ "--num_generations_eval",
60
+ "4",
61
+ "--max_completion_length",
62
+ "256",
63
+ "--temperature",
64
+ "0.50",
65
+ "--top_p",
66
+ "0.95",
67
+ "--top_k",
68
+ "50",
69
+ "--repetition_penalty",
70
+ "1.08",
71
+ "--learning_rate",
72
+ "5e-5",
73
+ "--lr_scheduler_type",
74
+ "cosine",
75
+ "--warmup_ratio",
76
+ "0.03",
77
+ "--report_to",
78
+ "wandb",
79
+ "--run_name",
80
+ "qwen3asr_dapo_reward56_4x4x12_12gen_4GPU",
81
+ "--output_dir",
82
+ "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/out/qwen3asr_dapo_reward56_4x4x12_12gen_4GPU",
83
+ "--save_strategy",
84
+ "steps",
85
+ "--save_steps",
86
+ "20",
87
+ "--logging_steps",
88
+ "5",
89
+ "--freeze_llm",
90
+ "false",
91
+ "--freeze_vit",
92
+ "false",
93
+ "--freeze_aligner",
94
+ "false",
95
+ "--remove_unused_columns",
96
+ "false",
97
+ "--padding_side",
98
+ "left"
99
+ ],
100
+ "program": "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/lib/python3.10/site-packages/swift/cli/rlhf.py",
101
+ "email": "pang_kaiyu@163.com",
102
+ "root": "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload",
103
+ "host": "SH-IDC1-10-140-37-95",
104
+ "executable": "/mnt/petrelfs/panjiabao/conda_envs/qwen3-asr_v2/bin/python3.10",
105
+ "cpu_count": 64,
106
+ "cpu_count_logical": 128,
107
+ "gpu": "NVIDIA A100-SXM4-80GB",
108
+ "gpu_count": 8,
109
+ "disk": {
110
+ "/": {
111
+ "total": "524945911808",
112
+ "used": "37368901632"
113
+ }
114
+ },
115
+ "memory": {
116
+ "total": "1081627828224"
117
+ },
118
+ "gpu_nvidia": [
119
+ {
120
+ "name": "NVIDIA A100-SXM4-80GB",
121
+ "memoryTotal": "85899345920",
122
+ "cudaCores": 6912,
123
+ "architecture": "Ampere",
124
+ "uuid": "GPU-87e7e3ab-b254-fc22-7407-8e2e88e9d854"
125
+ },
126
+ {
127
+ "name": "NVIDIA A100-SXM4-80GB",
128
+ "memoryTotal": "85899345920",
129
+ "cudaCores": 6912,
130
+ "architecture": "Ampere",
131
+ "uuid": "GPU-976db8a1-cf00-11c6-caaa-413862233fd4"
132
+ },
133
+ {
134
+ "name": "NVIDIA A100-SXM4-80GB",
135
+ "memoryTotal": "85899345920",
136
+ "cudaCores": 6912,
137
+ "architecture": "Ampere",
138
+ "uuid": "GPU-78b37ae8-44e0-e318-a6c0-f6f4ac78d46a"
139
+ },
140
+ {
141
+ "name": "NVIDIA A100-SXM4-80GB",
142
+ "memoryTotal": "85899345920",
143
+ "cudaCores": 6912,
144
+ "architecture": "Ampere",
145
+ "uuid": "GPU-840b937d-a7d4-68e7-ad57-f4568e01c3ae"
146
+ },
147
+ {
148
+ "name": "NVIDIA A100-SXM4-80GB",
149
+ "memoryTotal": "85899345920",
150
+ "cudaCores": 6912,
151
+ "architecture": "Ampere",
152
+ "uuid": "GPU-a9d0de54-f5b5-f83b-7bda-f53db844622d"
153
+ },
154
+ {
155
+ "name": "NVIDIA A100-SXM4-80GB",
156
+ "memoryTotal": "85899345920",
157
+ "cudaCores": 6912,
158
+ "architecture": "Ampere",
159
+ "uuid": "GPU-cb7d22e9-305c-c68c-64f1-599580742db0"
160
+ },
161
+ {
162
+ "name": "NVIDIA A100-SXM4-80GB",
163
+ "memoryTotal": "85899345920",
164
+ "cudaCores": 6912,
165
+ "architecture": "Ampere",
166
+ "uuid": "GPU-8d9704bb-4592-346f-a7f2-1a6ed8d58619"
167
+ },
168
+ {
169
+ "name": "NVIDIA A100-SXM4-80GB",
170
+ "memoryTotal": "85899345920",
171
+ "cudaCores": 6912,
172
+ "architecture": "Ampere",
173
+ "uuid": "GPU-3892f01b-e0b8-a9d9-0587-b5a7d2d9b5ab"
174
+ }
175
+ ],
176
+ "cudaVersion": "12.4",
177
+ "slurm": {
178
+ "cluster_name": "cluster_sproject3",
179
+ "conf": "/etc/slurm/slurm.conf",
180
+ "cpus_on_node": "2",
181
+ "gtids": "0",
182
+ "job_account": "research",
183
+ "job_cpus_per_node": "2",
184
+ "job_gid": "800000689",
185
+ "job_gpus": "0,1,2,6",
186
+ "job_id": "8574598",
187
+ "job_name": "qwen3_asr_train_4gpu",
188
+ "job_nodelist": "SH-IDC1-10-140-37-95",
189
+ "job_num_nodes": "1",
190
+ "job_partition": "interntmp",
191
+ "job_qos": "normal",
192
+ "job_uid": "800000689",
193
+ "job_user": "panjiabao",
194
+ "jobid": "8574598",
195
+ "localid": "0",
196
+ "nnodes": "1",
197
+ "node_aliases": "(null)",
198
+ "nodeid": "0",
199
+ "nodelist": "SH-IDC1-10-140-37-95",
200
+ "nprocs": "1",
201
+ "ntasks": "1",
202
+ "prio_process": "0",
203
+ "procid": "0",
204
+ "submit_dir": "/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload",
205
+ "submit_host": "SH-IDC1-10-140-37-164",
206
+ "task_pid": "9466",
207
+ "tasks_per_node": "1",
208
+ "topology_addr": "SH-IDC1-10-140-37-95",
209
+ "topology_addr_pattern": "node",
210
+ "working_cluster": "cluster_sproject3:SH-IDC1-10-140-37-161:6817:9216:109"
211
+ },
212
+ "writerId": "ess1zs9oqcfvbaak4xbqvnst142xqp1g"
213
+ }
wandb/run-20260418_172847-c2a5hfz3/files/wandb-summary.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"train/completions/max_length":374.1,"eval/kl":0.5471468614941498,"profiling/Time taken: GRPOTrainer.resample_encode_failed_inputs":0.10830203304067254,"profiling/Time taken: GRPOTrainer.generate":2.985434970119968,"eval/clip_ratio/region_mean":0,"train/reward_std":0.18413368090987206,"profiling/Time taken: GRPOTrainer._prepare_batch_inputs":1.4252209290862083,"eval/loss":0.023608719930052757,"train/clip_ratio/low_min":0.002832426130771637,"eval/frac_reward_zero_std":0.15566037735849056,"eval/rewards/ASRWerSubLenCmpHalluDirtyV56/std":0.5037064297862772,"train/clip_ratio/high_mean":0.013257157216624666,"eval/samples_per_second":1.028,"_wandb":{"runtime":167801},"train/global_step":1200,"train/kl":0.7693365861972173,"eval/steps_per_second":0.067,"eval/runtime":208.2116,"profiling/Time taken: GRPOTrainer.compute_loss":0.3779073969926685,"train/rewards/ASRWerSubLenCmpHalluDirtyV56/mean":0.16251326091587542,"eval/reward_std":0.1169186263643908,"profiling/Time taken: GRPOTrainer._generate_and_score_completions":5.926984405843541,"eval/clip_ratio/low_mean":0,"eval/clip_ratio/high_mean":0,"train/clip_ratio/high_max":0.028729480388574303,"profiling/Time taken: GRPOTrainer.ASRWerSubLenCmpHalluDirtyV56":0.06905108108185232,"profiling/Time taken: GRPOTrainer.log_metrics":0.022023104829713702,"train/clip_ratio/region_mean":0.028791408023486533,"train/frac_reward_zero_std":0,"eval/reward":0.4663126377283402,"eval/completions/mean_length":45.948113207547166,"train/completions/clipped_ratio":0.004166666666666667,"eval/clip_ratio/low_min":0,"eval/completions/clipped_ratio":0,"profiling/Time taken: 
GRPOTrainer._get_per_token_logps_and_entropies":0.3741553670261055,"train/clip_ratio/low_mean":0.015534250618657097,"eval/clip_ratio/high_max":0,"_step":598,"train/learning_rate":4.87350326370979e-05,"train/step_time":50.95165289340075,"eval/completions/max_length":59.15094339622642,"completions":{"size":31217,"ncols":6,"artifact_path":"wandb-client-artifact://jli2kdi7ef7w5pgm5t5mfpancx9qoq5net2vqru9ku5vuevkioj6uoqgmy6ojheyps4eavp8glqspzt63cid5rz59ib1yfz438dry4cbc1rcrle1x0kc6u6baofnvzp5/completions.table.json","_type":"table-file","sha256":"15ac642a65a06a04c3f33750733a3b61b5c428d4f70e069739b3c7df835ae44d","_latest_artifact_path":"wandb-client-artifact://mm4npojrnrffcjkkzw46vtbqn9bp7hms1vx6ohyncuuv16yny2waqf8rilfjn20oz6zu5pl07fwb5wqd7m6kprccayx2errp2xqtifzi27gnfukness54t79wm4t5agy:latest/completions.table.json","log_mode":"IMMUTABLE","nrows":48,"path":"media/table/completions_597_15ac642a65a06a04c3f3.table.json"},"profiling/Time taken: GRPOTrainer._score_completions":0.06985888280905783,"train/reward":0.1625132780522108,"_runtime":167801,"_timestamp":1.776672310555167e+09,"train/grad_norm":0.4121144711971283,"train/rewards/ASRWerSubLenCmpHalluDirtyV56/std":0.43018959313631056,"eval/rewards/ASRWerSubLenCmpHalluDirtyV56/mean":0.4663126377283402,"train/completions/mean_length":52.735418701171874,"train/completions/min_length":29.85,"train/epoch":0.3859761981344484,"train/loss":0.01593678444623947,"profiling/Time taken: GRPOTrainer._dynamic_sampling":1.2856517911422998,"eval/completions/min_length":30.39622641509434,"profiling/Time taken: GRPOTrainer._prepare_inputs":6.024027243256569e-06}
wandb/run-20260418_172847-c2a5hfz3/logs/debug-internal.log ADDED
@@ -0,0 +1,72 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"time":"2026-04-18T17:28:47.877484976+08:00","level":"INFO","msg":"stream: starting","core version":"0.23.0"}
2
+ {"time":"2026-04-18T17:28:48.347618035+08:00","level":"INFO","msg":"stream: created new stream","id":"c2a5hfz3"}
3
+ {"time":"2026-04-18T17:28:48.347701352+08:00","level":"INFO","msg":"handler: started","stream_id":"c2a5hfz3"}
4
+ {"time":"2026-04-18T17:28:48.350844585+08:00","level":"INFO","msg":"stream: started","id":"c2a5hfz3"}
5
+ {"time":"2026-04-18T17:28:48.350849894+08:00","level":"INFO","msg":"writer: started","stream_id":"c2a5hfz3"}
6
+ {"time":"2026-04-18T17:28:48.350854798+08:00","level":"INFO","msg":"sender: started","stream_id":"c2a5hfz3"}
7
+ {"time":"2026-04-18T17:37:33.858258418+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
8
+ {"time":"2026-04-19T02:34:07.470718868+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
9
+ {"time":"2026-04-19T02:38:39.32386773+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": http2: client conn could not be established"}
10
+ {"time":"2026-04-19T02:40:17.658933776+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
11
+ {"time":"2026-04-19T02:43:03.564180775+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
12
+ {"time":"2026-04-19T02:44:49.518795314+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
13
+ {"time":"2026-04-19T02:45:08.529740538+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
14
+ {"time":"2026-04-19T02:46:20.848321936+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
15
+ {"time":"2026-04-19T02:49:05.639172159+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
16
+ {"time":"2026-04-19T15:09:49.426045163+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
17
+ {"time":"2026-04-19T15:57:04.347389276+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
18
+ {"time":"2026-04-19T16:02:30.488210102+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
19
+ {"time":"2026-04-19T22:07:33.03303113+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
20
+ {"time":"2026-04-19T22:07:51.98901393+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
21
+ {"time":"2026-04-19T22:08:16.035247515+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
22
+ {"time":"2026-04-19T22:09:42.186767689+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
23
+ {"time":"2026-04-19T22:24:00.480169619+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
24
+ {"time":"2026-04-19T22:24:34.690158146+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
25
+ {"time":"2026-04-19T22:28:36.622066809+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
26
+ {"time":"2026-04-19T22:28:59.75540152+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
27
+ {"time":"2026-04-19T22:31:22.975036457+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
28
+ {"time":"2026-04-19T22:34:17.890202383+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
29
+ {"time":"2026-04-19T22:43:21.155119859+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
30
+ {"time":"2026-04-19T22:43:38.33530735+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
31
+ {"time":"2026-04-19T22:46:03.44895843+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
32
+ {"time":"2026-04-19T22:48:50.248056745+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
33
+ {"time":"2026-04-19T22:49:48.447601198+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
34
+ {"time":"2026-04-19T22:52:35.56119014+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
35
+ {"time":"2026-04-19T22:52:50.371922946+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
36
+ {"time":"2026-04-19T22:56:30.747794336+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
37
+ {"time":"2026-04-19T22:58:32.547706574+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
38
+ {"time":"2026-04-19T23:00:23.617563694+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
39
+ {"time":"2026-04-19T23:00:37.717734501+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
40
+ {"time":"2026-04-19T23:05:31.94573349+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
41
+ {"time":"2026-04-19T23:05:44.893259249+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
42
+ {"time":"2026-04-20T00:03:04.382543732+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
43
+ {"time":"2026-04-20T00:03:19.501053157+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
44
+ {"time":"2026-04-20T00:05:31.556601347+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
45
+ {"time":"2026-04-20T00:06:03.495128433+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
46
+ {"time":"2026-04-20T00:11:23.73287074+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
47
+ {"time":"2026-04-20T02:58:43.522847172+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": net/http: request canceled (Client.Timeout exceeded while awaiting headers)"}
48
+ {"time":"2026-04-20T02:59:04.598457045+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": context deadline exceeded"}
49
+ {"time":"2026-04-20T02:59:15.733502761+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": context deadline exceeded (Client.Timeout exceeded while awaiting headers)"}
50
+ {"time":"2026-04-20T02:59:49.917399553+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": context deadline exceeded (Client.Timeout exceeded while awaiting headers)"}
51
+ {"time":"2026-04-20T03:00:07.058218433+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": context deadline exceeded"}
52
+ {"time":"2026-04-20T03:00:29.606621937+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": net/http: request canceled (Client.Timeout exceeded while awaiting headers)"}
53
+ {"time":"2026-04-20T03:00:34.624296643+08:00","level":"INFO","msg":"flowcontrol: backed up, offloading to disk","recordNumber":124381}
54
+ {"time":"2026-04-20T03:00:46.264621657+08:00","level":"INFO","msg":"flowcontrol: unblocked","totalOffloaded":1}
55
+ {"time":"2026-04-20T03:44:43.734398398+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": context deadline exceeded (Client.Timeout exceeded while awaiting headers)"}
56
+ {"time":"2026-04-20T04:11:48.762158534+08:00","level":"INFO","msg":"api: retrying HTTP error","status":503,"url":"https://api.wandb.ai/graphql","body":"upstream connect error or disconnect/reset before headers. reset reason: connection termination"}
57
+ {"time":"2026-04-20T04:13:58.74920069+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": net/http: request canceled (Client.Timeout exceeded while awaiting headers)"}
58
+ {"time":"2026-04-20T06:34:34.21211755+08:00","level":"INFO","msg":"api: retrying HTTP error","status":503,"url":"https://api.wandb.ai/graphql","body":"upstream connect error or disconnect/reset before headers. reset reason: connection termination"}
59
+ {"time":"2026-04-20T10:50:53.628901466+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
60
+ {"time":"2026-04-20T16:00:42.158363018+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
61
+ {"time":"2026-04-20T16:02:08.101875007+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
62
+ {"time":"2026-04-20T16:03:45.141714956+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
63
+ {"time":"2026-04-20T16:04:52.17332644+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
64
+ {"time":"2026-04-20T16:05:06.320377956+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
65
+ {"time":"2026-04-20T16:05:29.800728083+08:00","level":"ERROR","msg":"sender: sendStopStatus: failed to get run stopped status: context deadline exceeded (Client.Timeout or context cancellation while reading body)"}
66
+ {"time":"2026-04-20T16:05:30.799799131+08:00","level":"INFO","msg":"stream: closing","id":"c2a5hfz3"}
67
+ {"time":"2026-04-20T16:05:39.191906442+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
68
+ {"time":"2026-04-20T16:05:43.710909983+08:00","level":"INFO","msg":"fileTransfer: Close: file transfer manager closed"}
69
+ {"time":"2026-04-20T16:06:10.469686843+08:00","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/files/pang_kaiyu-none/qwen3_asr_swift_dapo/c2a5hfz3/file_stream\": unexpected EOF"}
70
+ {"time":"2026-04-20T16:06:17.397266507+08:00","level":"INFO","msg":"handler: closed","stream_id":"c2a5hfz3"}
71
+ {"time":"2026-04-20T16:06:17.400263519+08:00","level":"INFO","msg":"sender: closed","stream_id":"c2a5hfz3"}
72
+ {"time":"2026-04-20T16:06:17.40028542+08:00","level":"INFO","msg":"stream: closed","id":"c2a5hfz3"}
wandb/run-20260418_172847-c2a5hfz3/logs/debug.log ADDED
@@ -0,0 +1,26 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2026-04-18 17:28:47,491 INFO MainThread:10295 [wandb_setup.py:_flush():80] Current SDK version is 0.23.0
2
+ 2026-04-18 17:28:47,491 INFO MainThread:10295 [wandb_setup.py:_flush():80] Configure stats pid to 10295
3
+ 2026-04-18 17:28:47,491 INFO MainThread:10295 [wandb_setup.py:_flush():80] Loading settings from /mnt/petrelfs/panjiabao/.config/wandb/settings
4
+ 2026-04-18 17:28:47,491 INFO MainThread:10295 [wandb_setup.py:_flush():80] Loading settings from /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/wandb/settings
5
+ 2026-04-18 17:28:47,491 INFO MainThread:10295 [wandb_setup.py:_flush():80] Loading settings from environment variables
6
+ 2026-04-18 17:28:47,491 INFO MainThread:10295 [wandb_init.py:setup_run_log_directory():713] Logging user logs to /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/wandb/run-20260418_172847-c2a5hfz3/logs/debug.log
7
+ 2026-04-18 17:28:47,491 INFO MainThread:10295 [wandb_init.py:setup_run_log_directory():714] Logging internal logs to /mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/wandb/run-20260418_172847-c2a5hfz3/logs/debug-internal.log
8
+ 2026-04-18 17:28:47,491 INFO MainThread:10295 [wandb_init.py:init():840] calling init triggers
9
+ 2026-04-18 17:28:47,491 INFO MainThread:10295 [wandb_init.py:init():845] wandb.init called with sweep_config: {}
10
+ config: {'_wandb': {}}
11
+ 2026-04-18 17:28:47,491 INFO MainThread:10295 [wandb_init.py:init():888] starting backend
12
+ 2026-04-18 17:28:47,865 INFO MainThread:10295 [wandb_init.py:init():891] sending inform_init request
13
+ 2026-04-18 17:28:47,870 INFO MainThread:10295 [wandb_init.py:init():899] backend started and connected
14
+ 2026-04-18 17:28:47,874 INFO MainThread:10295 [wandb_init.py:init():969] updated telemetry
15
+ 2026-04-18 17:28:47,875 INFO MainThread:10295 [wandb_init.py:init():993] communicating run to backend with 90.0 second timeout
16
+ 2026-04-18 17:28:49,589 INFO MainThread:10295 [wandb_init.py:init():1040] starting run threads in backend
17
+ 2026-04-18 17:28:50,217 INFO MainThread:10295 [wandb_run.py:_console_start():2504] atexit reg
18
+ 2026-04-18 17:28:50,218 INFO MainThread:10295 [wandb_run.py:_redirect():2352] redirect: wrap_raw
19
+ 2026-04-18 17:28:50,218 INFO MainThread:10295 [wandb_run.py:_redirect():2421] Wrapping output streams.
20
+ 2026-04-18 17:28:50,218 INFO MainThread:10295 [wandb_run.py:_redirect():2444] Redirects installed.
21
+ 2026-04-18 17:28:50,224 INFO MainThread:10295 [wandb_init.py:init():1080] run started, returning control to user process
22
+ 2026-04-18 17:28:50,229 INFO MainThread:10295 [wandb_run.py:_config_callback():1385] config_cb None None {'peft_config': {'default': {'task_type': 'CAUSAL_LM', 'peft_type': 'LORA', 'auto_mapping': None, 'peft_version': '0.18.1', 'base_model_name_or_path': '/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/qwen3-asr-merged', 'revision': None, 'inference_mode': False, 'r': 8, 'target_modules': '^(thinker\\.model(?=\\.).*\\.(up_proj|q_proj|o_proj|gate_proj|k_proj|v_proj|down_proj)|thinker\\.audio_tower\\.layers(?=\\.).*\\.(q_proj|fc1|out_proj|k_proj|v_proj|fc2)|thinker\\.audio_tower\\.conv_out(?=\\.)|thinker\\.audio_tower\\.proj1(?=\\.)|thinker\\.audio_tower\\.proj2(?=\\.))$', 'exclude_modules': None, 'lora_alpha': 32, 'lora_dropout': 0.05, 'fan_in_fan_out': False, 'bias': 'none', 'use_rslora': False, 'modules_to_save': [], 'init_lora_weights': True, 'layers_to_transform': None, 'layers_pattern': None, 'rank_pattern': {}, 'alpha_pattern': {}, 'megatron_config': None, 'megatron_core': 'megatron.core', 'trainable_token_indices': None, 'loftq_config': {}, 'eva_config': None, 'corda_config': None, 'use_dora': False, 'alora_invocation_tokens': None, 'use_qalora': False, 'qalora_group_size': 16, 'layer_replication': None, 'runtime_config': {'ephemeral_gpu_offload': False}, 'lora_bias': False, 'target_parameters': None, 'arrow_config': None, 'ensure_weight_tying': False, 'lora_dtype': None, 'lorap_lr_ratio': None, 'lorap_emb_lr': 1e-06}}, 'return_dict': True, 'output_hidden_states': False, 'torchscript': False, 'dtype': 'bfloat16', 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'architectures': ['Qwen3ASRForConditionalGeneration'], 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'task_specific_params': None, 'problem_type': None, 
'tokenizer_class': None, 'prefix': None, 'bos_token_id': None, 'pad_token_id': 151643, 'eos_token_id': 151645, 'sep_token_id': None, 'decoder_start_token_id': None, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'temperature': 0.5, 'top_k': 50, 'top_p': 0.95, 'typical_p': 1.0, 'repetition_penalty': 1.08, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'num_beam_groups': 1, 'diversity_penalty': 0.0, '_name_or_path': '/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/qwen3-asr-merged', 'transformers_version': '4.57.6', 'model_type': 'qwen3_asr', 'tf_legacy_loss': False, 'use_bfloat16': False, 'thinker_config': {'return_dict': True, 'output_hidden_states': False, 'torchscript': False, 'dtype': 'bfloat16', 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'architectures': ['Qwen3ASRForConditionalGeneration'], 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'task_specific_params': None, 'problem_type': None, 'tokenizer_class': None, 'prefix': None, 'bos_token_id': None, 'pad_token_id': None, 'eos_token_id': None, 'sep_token_id': None, 'decoder_start_token_id': None, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'typical_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 
'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'num_beam_groups': 1, 'diversity_penalty': 0.0, '_name_or_path': '', 'audio_end_token_id': 151670, 'model_type': 'qwen3_asr_thinker', 'tf_legacy_loss': False, 'use_bfloat16': False, 'user_token_id': 872, 'audio_start_token_id': 151669, 'initializer_range': 0.02, 'audio_config': {'return_dict': True, 'output_hidden_states': False, 'torchscript': False, 'dtype': None, 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'architectures': None, 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'task_specific_params': None, 'problem_type': None, 'tokenizer_class': None, 'prefix': None, 'bos_token_id': None, 'pad_token_id': None, 'eos_token_id': None, 'sep_token_id': None, 'decoder_start_token_id': None, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'typical_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'num_beam_groups': 1, 'diversity_penalty': 0.0, '_name_or_path': '', 'model_type': 'qwen3_asr_audio_encoder', 'num_hidden_layers': 24, 'tf_legacy_loss': False, 'use_bfloat16': False, 'num_mel_bins': 128, 'd_model': 
1024, 'encoder_layers': 24, 'encoder_attention_heads': 16, 'encoder_ffn_dim': 4096, 'dropout': 0, 'attention_dropout': 0, 'activation_function': 'gelu', 'activation_dropout': 0, 'initializer_range': 0.02, 'scale_embedding': False, 'max_source_positions': 1500, 'n_window': 50, 'output_dim': 2048, 'n_window_infer': 800, 'conv_chunksize': 500, 'downsample_hidden_size': 480, 'output_attentions': False}, 'text_config': {'vocab_size': 151936, 'max_position_embeddings': 65536, 'hidden_size': 2048, 'intermediate_size': 6144, 'num_hidden_layers': 28, 'num_attention_heads': 16, 'num_key_value_heads': 8, 'head_dim': 128, 'hidden_act': 'silu', 'initializer_range': 0.02, 'rms_norm_eps': 1e-06, 'use_cache': False, 'rope_theta': 1000000, 'rope_scaling': {'interleaved': True, 'mrope_interleaved': True, 'mrope_section': [24, 20, 20], 'rope_type': 'default', 'type': 'default'}, 'attention_bias': False, 'attention_dropout': 0.0, 'return_dict': True, 'output_hidden_states': False, 'torchscript': False, 'dtype': None, 'pruned_heads': {}, 'tie_word_embeddings': True, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'architectures': None, 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'task_specific_params': None, 'problem_type': None, 'tokenizer_class': None, 'prefix': None, 'bos_token_id': None, 'pad_token_id': 151643, 'eos_token_id': None, 'sep_token_id': None, 'decoder_start_token_id': None, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'typical_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 
'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, 'num_beam_groups': 1, 'diversity_penalty': 0.0, '_name_or_path': '', 'model_type': 'qwen3_asr_text', 'tf_legacy_loss': False, 'use_bfloat16': False, 'output_attentions': False}, 'audio_token_id': 151676, 'output_attentions': False}, 'support_languages': ['Chinese', 'English', 'Cantonese', 'Arabic', 'German', 'French', 'Spanish', 'Portuguese', 'Indonesian', 'Italian', 'Korean', 'Russian', 'Thai', 'Vietnamese', 'Japanese', 'Turkish', 'Hindi', 'Malay', 'Dutch', 'Swedish', 'Danish', 'Finnish', 'Polish', 'Czech', 'Filipino', 'Persian', 'Greek', 'Romanian', 'Hungarian', 'Macedonian'], 'output_attentions': False, 'output_dir': '/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/out/qwen3asr_dapo_reward56_4x4x12_12gen_4GPU/v5-20260418-172837', 'overwrite_output_dir': False, 'do_train': False, 'do_eval': True, 'do_predict': False, 'eval_strategy': 'steps', 'prediction_loss_only': False, 'per_device_train_batch_size': 4, 'per_device_eval_batch_size': 4, 'per_gpu_train_batch_size': None, 'per_gpu_eval_batch_size': None, 'gradient_accumulation_steps': 12, 'eval_accumulation_steps': None, 'eval_delay': 0, 'torch_empty_cache_steps': None, 'learning_rate': 5e-05, 'weight_decay': 0.1, 'adam_beta1': 0.9, 'adam_beta2': 0.95, 'adam_epsilon': 1e-08, 'max_grad_norm': 1.0, 'num_train_epochs': 3.0, 'max_steps': -1, 'lr_scheduler_type': 'cosine', 'lr_scheduler_kwargs': None, 'warmup_ratio': 0.03, 'warmup_steps': 0, 'log_level': 'passive', 'log_level_replica': 'warning', 'log_on_each_node': True, 'logging_dir': '/mnt/dhwfile/raise/user/panjiabao/huxiaobin/zhanghaobin/0416upload/out/qwen3asr_dapo_reward56_4x4x12_12gen_4GPU/v5-20260418-172837/runs', 'logging_strategy': 'steps', 'logging_first_step': True, 'logging_steps': 5, 'logging_nan_inf_filter': True, 'save_strategy': 'steps', 'save_steps': 20, 'save_total_limit': 
None, 'save_safetensors': True, 'save_on_each_node': False, 'save_only_model': False, 'restore_callback_states_from_checkpoint': False, 'no_cuda': False, 'use_cpu': False, 'use_mps_device': False, 'seed': 42, 'data_seed': 42, 'jit_mode_eval': False, 'bf16': True, 'fp16': False, 'fp16_opt_level': 'O1', 'half_precision_backend': 'auto', 'bf16_full_eval': False, 'fp16_full_eval': False, 'tf32': None, 'local_rank': 0, 'ddp_backend': None, 'tpu_num_cores': None, 'tpu_metrics_debug': False, 'debug': [], 'dataloader_drop_last': True, 'eval_steps': 20, 'dataloader_num_workers': 1, 'dataloader_prefetch_factor': 2, 'past_index': -1, 'run_name': 'qwen3asr_dapo_reward56_4x4x12_12gen_4GPU', 'disable_tqdm': False, 'remove_unused_columns': False, 'label_names': None, 'load_best_model_at_end': False, 'metric_for_best_model': 'loss', 'greater_is_better': False, 'ignore_data_skip': False, 'fsdp': [], 'fsdp_min_num_params': 0, 'fsdp_config': {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}, 'fsdp_transformer_layer_cls_to_wrap': None, 'accelerator_config': {'split_batches': False, 'dispatch_batches': False, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None}, 'parallelism_config': None, 'deepspeed': None, 'label_smoothing_factor': 0.0, 'optim': 'adamw_torch', 'optim_args': None, 'adafactor': False, 'group_by_length': False, 'length_column_name': 'length', 'report_to': ['wandb'], 'project': 'huggingface', 'trackio_space_id': 'trackio', 'ddp_find_unused_parameters': None, 'ddp_bucket_cap_mb': None, 'ddp_broadcast_buffers': None, 'dataloader_pin_memory': True, 'dataloader_persistent_workers': False, 'skip_memory_metrics': True, 'use_legacy_prediction_loop': False, 'push_to_hub': False, 'resume_from_checkpoint': None, 'hub_model_id': None, 'hub_strategy': 'every_save', 'hub_token': '<HUB_TOKEN>', 'hub_private_repo': None, 'hub_always_push': False, 'hub_revision': None, 
'gradient_checkpointing': False, 'gradient_checkpointing_kwargs': None, 'include_inputs_for_metrics': False, 'include_for_metrics': [], 'eval_do_concat_batches': True, 'fp16_backend': 'auto', 'push_to_hub_model_id': None, 'push_to_hub_organization': None, 'push_to_hub_token': '<PUSH_TO_HUB_TOKEN>', 'mp_parameters': '', 'auto_find_batch_size': False, 'full_determinism': False, 'torchdynamo': None, 'ray_scope': 'last', 'ddp_timeout': 18000000, 'torch_compile': False, 'torch_compile_backend': None, 'torch_compile_mode': None, 'include_tokens_per_second': False, 'include_num_input_tokens_seen': 'no', 'neftune_noise_alpha': None, 'optim_target_modules': None, 'batch_eval_metrics': False, 'eval_on_start': False, 'use_liger_kernel': False, 'liger_kernel_config': None, 'eval_use_gather_object': False, 'average_tokens_across_devices': True, 'model_init_kwargs': None, 'disable_dropout': False, 'cast_lm_head_to_fp32': False, 'num_generations': 12, 'num_generations_eval': 4, 'max_completion_length': 256, 'ds3_gather_for_generation': True, 'shuffle_dataset': True, 'generation_batch_size': 48, 'steps_per_generation': 3, 'min_p': None, 'generation_kwargs': None, 'chat_template_kwargs': None, 'use_transformers_paged': False, 'cache_implementation': None, 'use_vllm': False, 'vllm_mode': None, 'vllm_model_impl': 'vllm', 'vllm_enable_sleep_mode': False, 'vllm_structured_outputs_regex': None, 'vllm_server_base_url': None, 'vllm_server_host': None, 'vllm_server_port': [8000], 'vllm_server_timeout': 240.0, 'vllm_group_port': 51216, 'vllm_gpu_memory_utilization': 0.9, 'vllm_max_model_length': None, 'vllm_tensor_parallel_size': 1, 'beta': 0.04, 'num_iterations': 2, 'epsilon': 0.2, 'delta': None, 'epsilon_high': 0.28, 'sapo_temperature_neg': 1.05, 'sapo_temperature_pos': 1.0, 'importance_sampling_level': 'token', 'reward_weights': None, 'multi_objective_aggregation': 'sum_then_normalize', 'scale_rewards': 'group', 'loss_type': 'dapo', 'mask_truncated_completions': False, 'sync_ref_model': 
False, 'ref_model_mixup_alpha': 0.6, 'ref_model_sync_steps': 512, 'top_entropy_quantile': 1.0, 'max_tool_calling_iterations': None, 'vllm_importance_sampling_correction': True, 'vllm_importance_sampling_mode': 'sequence_mask', 'vllm_importance_sampling_cap': 3.0, 'off_policy_mask_threshold': None, 'use_bias_correction_kl': False, 'log_completions': True, 'num_completions_to_print': None, 'log_unique_prompts': False, 'log_completions_hub_repo': None, 'tuner_backend': 'peft', 'vit_gradient_checkpointing': True, 'router_aux_loss_coef': 0.0, 'enable_dft_loss': False, 'enable_channel_loss': False, 'safe_serialization': True, 'max_shard_size': '5GB', 'check_model': True, 'acc_strategy': 'token', 'train_dataloader_shuffle': True, 'max_epochs': None, 'aligner_lr': None, 'vit_lr': None, 'use_logits_to_keep': None, 'resume_only_model': False, 'optimizer': None, 'eval_metric': None, 'callbacks': [], 'early_stop_interval': None, 'eval_use_evalscope': False, 'eval_dataset': [], 'eval_dataset_args': None, 'eval_limit': None, 'eval_generation_config': None, 'extra_eval_args': None, 'tuner_type': 'lora', 'use_galore': False, 'galore_target_modules': None, 'galore_rank': 128, 'galore_update_proj_gap': 50, 'galore_scale': 1.0, 'galore_proj_type': 'std', 'galore_optim_per_parameter': False, 'galore_with_embedding': False, 'galore_quantization': False, 'galore_proj_quant': False, 'galore_proj_bits': 4, 'galore_proj_group_size': 256, 'galore_cos_threshold': 0.4, 'galore_gamma_proj': 2, 'galore_queue_size': 5, 'lisa_activated_layers': 0, 'lisa_step_interval': 20, 'use_flash_ckpt': False, 'vllm_pipeline_parallel_size': 1, 'vllm_enable_expert_parallel': False, 'vllm_max_num_seqs': None, 'vllm_max_model_len': None, 'vllm_disable_custom_all_reduce': True, 'vllm_enforce_eager': False, 'vllm_limit_mm_per_prompt': None, 'vllm_max_lora_rank': 16, 'vllm_enable_prefix_caching': True, 'vllm_use_async_engine': None, 'vllm_quantization': None, 'vllm_reasoning_parser': None, 
'vllm_disable_cascade_attn': False, 'vllm_mm_processor_cache_gb': None, 'vllm_speculative_config': None, 'vllm_engine_kwargs': {}, 'vllm_data_parallel_size': 1, 'stop_words': [], 'vllm_enable_lora': False, 'lora_rank': 8, 'vllm_server_group_port': None, 'enable_flattened_weight_sync': True, 'async_generate': False, 'structured_outputs_regex': None, 'sleep_level': 0, 'move_model_batches': None, 'offload_optimizer': False, 'offload_model': False, 'wandb_log_unique_prompts': None, 'cosine_min_len_value_wrong': -0.5, 'cosine_max_len_value_wrong': 0.0, 'cosine_min_len_value_correct': 1.0, 'cosine_max_len_value_correct': 0.5, 'cosine_max_len': 256, 'repetition_n_grams': 3, 'repetition_max_penalty': -1.0, 'reward_model': None, 'reward_model_plugin': None, 'chord_sft_dataset': [], 'chord_sft_per_device_train_batch_size': None, 'chord_enable_phi_function': False, 'chord_mu_warmup_steps': None, 'chord_mu_decay_steps': None, 'chord_mu_peak': None, 'chord_mu_valley': None, 'multi_turn_scheduler': None, 'max_turns': None, 'completion_length_limit_scope': 'per_round', 'vllm_server_pass_dataset': False, 'dynamic_sample': True, 'max_resample_times': 4, 'overlong_filter': True, 'soft_max_length': None, 'soft_cache_length': None, 'log_entropy': False, 'tau_pos': 1.0, 'tau_neg': 1.05, 'advantage_estimator': 'grpo', 'kl_in_reward': False, 'dataset_shuffle': True, 'rollout_importance_sampling_mode': None, 'rollout_importance_sampling_threshold': 2.0, 'log_rollout_offpolicy_metrics': False, 'off_policy_sequence_mask_delta': None}
23
+ 2026-04-18 17:28:50,239 INFO MainThread:10295 [wandb_config.py:__setitem__():154] [no run ID] config set model/num_parameters = 2050307712 - <bound method Run._config_callback of <wandb.sdk.wandb_run.Run object at 0x7f7e494768f0>>
24
+ 2026-04-18 17:28:50,239 INFO MainThread:10295 [wandb_run.py:_config_callback():1385] config_cb model/num_parameters 2050307712 None
25
+ 2026-04-20 16:05:30,791 INFO wandb-AsyncioManager-main:10295 [service_client.py:_forward_responses():80] Reached EOF.
26
+ 2026-04-20 16:05:30,792 INFO wandb-AsyncioManager-main:10295 [mailbox.py:close():137] Closing mailbox, abandoning 1 handles.