| #!/usr/bin/env node |
|
|
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
|
|
| import fs from 'node:fs/promises'; |
| import path from 'node:path'; |
|
|
| function parseArgs(argv){ |
| const args = { in: '', out: '', seed: undefined, amount: 1, inPlace: false }; |
| for (let i = 2; i < argv.length; i++){ |
| const a = argv[i]; |
| if (a === '--in' && argv[i+1]) { args.in = argv[++i]; continue; } |
| if (a === '--out' && argv[i+1]) { args.out = argv[++i]; continue; } |
| if (a === '--seed' && argv[i+1]) { args.seed = Number(argv[++i]); continue; } |
| if (a === '--amount' && argv[i+1]) { args.amount = Number(argv[++i]) || 3; continue; } |
| if (a === '--in-place') { args.inPlace = true; continue; } |
| } |
| if (!args.in) throw new Error('--in is required'); |
| if (args.inPlace) args.out = args.in; |
| if (!args.out) { |
| const { dir, name, ext } = path.parse(args.in); |
| args.out = path.join(dir, `${name}.jitter${ext || '.csv'}`); |
| } |
| return args; |
| } |
|
|
| function mulberry32(seed){ |
| let t = seed >>> 0; |
| return function(){ |
| t += 0x6D2B79F5; |
| let r = Math.imul(t ^ (t >>> 15), 1 | t); |
| r ^= r + Math.imul(r ^ (r >>> 7), 61 | r); |
| return ((r ^ (r >>> 14)) >>> 0) / 4294967296; |
| }; |
| } |
|
|
| function makeRng(seed){ |
| if (Number.isFinite(seed)) return mulberry32(seed); |
| return Math.random; |
| } |
|
|
| function randn(rng){ |
| |
| let u = 0, v = 0; |
| while (u === 0) u = rng(); |
| while (v === 0) v = rng(); |
| return Math.sqrt(-2.0 * Math.log(u)) * Math.cos(2.0 * Math.PI * v); |
| } |
|
|
| function jitterValue(metric, value, amount, rng){ |
| const m = metric.toLowerCase(); |
| if (m === 'epoch') return value; |
| if (m.includes('accuracy')){ |
| const n = Math.max(-0.02 * amount, Math.min(0.02 * amount, randn(rng) * 0.01 * amount)); |
| return Math.max(0, Math.min(1, value + n)); |
| } |
| if (m.includes('loss')){ |
| const n = Math.max(-0.03 * amount, Math.min(0.03 * amount, randn(rng) * 0.01 * amount)); |
| return Math.max(0, value + n); |
| } |
| |
| const n = Math.max(-0.01 * amount, Math.min(0.01 * amount, randn(rng) * 0.005 * amount)); |
| return value + n; |
| } |
|
|
| function formatNumberLike(original, value){ |
| const s = String(original); |
| const dot = s.indexOf('.') |
| const decimals = dot >= 0 ? (s.length - dot - 1) : 0; |
| if (!Number.isFinite(value)) return s; |
| if (decimals <= 0) return String(Math.round(value)); |
| return value.toFixed(decimals); |
| } |
|
|
| async function main(){ |
| const args = parseArgs(process.argv); |
| const rng = makeRng(args.seed); |
| const raw = await fs.readFile(args.in, 'utf8'); |
| const lines = raw.split(/\r?\n/); |
| const out = new Array(lines.length); |
|
|
| for (let i = 0; i < lines.length; i++){ |
| const line = lines[i]; |
| if (!line || line.trim().length === 0) { out[i] = line; continue; } |
| if (/^\s*#/.test(line)) { out[i] = line; continue; } |
|
|
| |
| if (i === 0 && /^\s*run\s*,\s*step\s*,\s*metric\s*,\s*value\s*,\s*stderr\s*$/i.test(line)) { |
| out[i] = line; continue; |
| } |
|
|
| const cols = line.split(','); |
| if (cols.length < 4) { out[i] = line; continue; } |
|
|
| const [run, stepStr, metric, valueStr, stderrStr = ''] = cols; |
| const trimmedMetric = (metric || '').trim(); |
| const valueNum = Number((valueStr || '').trim()); |
|
|
| if (!Number.isFinite(valueNum)) { out[i] = line; continue; } |
|
|
| const jittered = jitterValue(trimmedMetric, valueNum, args.amount, rng); |
| const valueOut = formatNumberLike(valueStr, jittered); |
|
|
| |
| const result = [run, stepStr, metric, valueOut, stderrStr].join(','); |
| out[i] = result; |
| } |
|
|
| const finalText = out.join('\n'); |
| await fs.writeFile(args.out, finalText, 'utf8'); |
| const relIn = path.relative(process.cwd(), args.in); |
| const relOut = path.relative(process.cwd(), args.out); |
| console.log(`Jittered data written: ${relOut} (from ${relIn})`); |
| } |
|
|
| main().catch(err => { |
| console.error(err?.stack || String(err)); |
| process.exit(1); |
| }); |
|
|