Docgenie-API / scripts /experiments /02_v2_sampling_eval /train_entity_labeling.sh
Ahadhassan-2003
deploy: update HF Space
5c36ec7
#!/bin/bash
# Locate the shared base.sh that sits next to this script, so the path
# resolves correctly regardless of the caller's working directory.
# CDPATH is cleared for the cd so that a relative directory name can neither
# be resolved through an inherited CDPATH nor make cd print an extra path into
# the captured output; "--" keeps a path beginning with "-" from being parsed
# as an option.
SCRIPT_DIR="$(CDPATH='' cd -- "$(dirname -- "${BASH_SOURCE[0]}")" && pwd)"
BASE_SCRIPT="${SCRIPT_DIR}/base.sh"
# Model configurations to train. Each entry is a single string made of a short
# model label, a "|" separator, and the command-line flags for that model.
# NOTE(review): the entry is presumably split on "|" by base.sh — confirm there.
declare -a model_configs=()
model_configs+=("layoutlmv3|--model-name microsoft/layoutlmv3-base --tokenizer-name microsoft/layoutlmv3-base --use-segment-level-bboxes")
# Dataset name for each run, one slot per alpha setting (every slot is "cord").
# NOTE(review): presumably paired by index with synthetic_dataset_names —
# confirm against base.sh.
declare -a dataset_names=(
  [0]="cord" # alpha 1.0
  [1]="cord" # alpha 0.75
  [2]="cord" # alpha 0.5
)
# Synthetic dataset name for each run, listed in order of decreasing alpha.
# NOTE(review): presumably paired by index with dataset_names — confirm
# against base.sh.
declare -a synthetic_dataset_names=()
synthetic_dataset_names+=("cord_alpha=1.0")  # alpha 1.0
synthetic_dataset_names+=("cord_alpha=0.75") # alpha 0.75
synthetic_dataset_names+=("cord_alpha=0.5")  # alpha 0.5
# Metric name recorded for each run; all three slots use the same validation
# seqeval F1 score.
# NOTE(review): presumably one slot per dataset entry — confirm against base.sh.
declare -a monitored_metrics=()
monitored_metrics[0]="validation/seqeval/f1_score"
monitored_metrics[1]="validation/seqeval/f1_score"
monitored_metrics[2]="validation/seqeval/f1_score"
# Task-level command-line flags, kept as one space-separated string and built
# up in groups: optimizer settings, batch sizes, then schedule/dataset flags.
TASK_ARGUMENTS="--optimizer adamw --lr-start 2.0e-5"
TASK_ARGUMENTS+=" --train-batch-size 16 --eval-batch-size 16"
TASK_ARGUMENTS+=" --num-epochs 100 --use-preprocessed-dataset"
# Hand over to the shared base script, forwarding this script's command-line
# arguments unchanged. It is read into the current shell rather than run as a
# child process, so the variables set in this file are visible to it.
. "${BASE_SCRIPT}" "$@"