File size: 390 Bytes
9b2cded
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
#!/usr/bin/env bash
#
# Launch CodeBERT cross-encoder training through the src.hf_train_codebert
# Python module and report the output directory once the command succeeds.
#
# Positional arguments (all optional):
#   $1  value passed as --data        (default: data/sql_errors_dev.parquet)
#   $2  value passed as --output-dir  (default: models/codebert-cross-encoder)
#   $3  when non-empty, forwarded as --max-samples; otherwise the flag is omitted
#
# NOTE(review): `python -m src.hf_train_codebert` needs the `src` package to be
# importable, so this is presumably meant to run from the repository root —
# confirm against the project layout.
#
# Strict mode: abort on any failing command, unset variable, or failed
# pipeline stage, so a training failure never reaches the "Done" message.
set -euo pipefail

main() {
  local dataset="${1:-data/sql_errors_dev.parquet}"
  local model_dir="${2:-models/codebert-cross-encoder}"
  local sample_cap="${3:-}"

  # Arguments are kept in an array so values containing spaces stay intact.
  local -a train_args=(--data "${dataset}" --output-dir "${model_dir}")

  # Forward the sample cap only when the caller actually supplied one.
  [[ -z "${sample_cap}" ]] || train_args+=(--max-samples "${sample_cap}")

  printf '%s\n' "==> Training CodeBERT cross-encoder..."
  python -m src.hf_train_codebert "${train_args[@]}"

  printf '%s\n' "==> Done. Model at ${model_dir}"
}

main "$@"