live-lm-critic / gec /download_data.sh
Olivia Figueira
Upload code with streamlit addition
b6e5241
conda activate errant200
######################## Set up benckmarks ########################
mkdir -p benchmarks
cd benchmarks
#Prepare CoNLL2014
wget https://www.comp.nus.edu.sg/~nlp/conll14st/conll14st-test-data.tar.gz
tar -xf conll14st-test-data.tar.gz
python3 scripts/get_orig_from_m2.py conll14st-test-data/noalt/official-2014.combined.m2 \
-out conll14st-test-data/noalt/official-2014.combined.orig.txt
#Prepare BEA2019
wget https://www.cl.cam.ac.uk/research/nl/bea2019st/data/wi+locness_v2.1.bea19.tar.gz
tar -xf wi+locness_v2.1.bea19.tar.gz
mv wi+locness wi+locness_v2.1.bea19
python3 scripts/get_orig_from_m2.py wi+locness_v2.1.bea19/m2/ABCN.dev.gold.bea19.m2 \
-out wi+locness_v2.1.bea19/m2/ABCN.dev.bea19.orig.txt
#Prepare GMEG-wiki and -yahoo
git clone https://github.com/grammarly/GMEG.git
root=GMEG/data/test/wiki
errant_parallel -orig $root/source \
-cor $root/ref0 $root/ref1 $root/ref2 $root/ref3 \
-out $root/ref.m2
root=GMEG/data/test/yahoo
errant_parallel -orig $root/source \
-cor $root/ref0 $root/ref1 $root/ref2 $root/ref3 \
-out $root/ref.m2
#Download M2 scorer
git clone https://github.com/nusnlp/m2scorer.git
######################## Download training data ########################
cd ../
wget https://nlp.stanford.edu/projects/myasu/LM-Critic/data.zip
unzip data.zip