File size: 1,075 Bytes
ee0ec3d
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
#!/bin/sh

# Two positional arguments are required: the data directory name and a date
# tag. With fewer, print a usage line to stderr and exit with status 1.
if [ $# -lt 2 ]; then
  echo Usage $0 datadir date >&2
  exit 1
fi

# Store the two arguments and drop them from the positional parameters.
data="$1"
date="$2"
shift 2

# Copy the model of every treebank named in the first tab-separated column
# of ../$data/langs_sizes into the current directory as
# <treebank>-<data>-<date>.model.
#
# When ../$data/<lang>_all exists and the treebank is not listed in
# models_non_shared.txt, the <lang>_all model is copied instead and the
# per-treebank name is made a symlink to that copy.
#
# The command substitution is deliberately unquoted: every
# whitespace-separated word of the cut output is one treebank name.
for treebank in $(cut -f1 "../$data/langs_sizes"); do
  # Entries ending in _all are not handled on their own.
  case $treebank in *_all) continue ;; esac

  # Language prefix: everything before the first underscore.
  lang=${treebank%%_*}

  # -x -F compares the whole line literally, so characters such as "." in a
  # treebank name are not interpreted as regular-expression operators.
  if [ -d "../$data/${lang}_all" ] && ! grep -qxF -e "$treebank" models_non_shared.txt; then
    # The exclude pattern is quoted so that the shell cannot expand it
    # against files in the current directory before rsync receives it.
    rsync -av -m --delete --exclude '*.v2' --exclude training.log \
      "../models/$data-${lang}_all/" "${lang}_all-$data-$date.model"
    # -n: replace an existing symlink rather than descending into its target.
    ln -fsn "${lang}_all-$data-$date.model" "$treebank-$data-$date.model"
  else
    rsync -av -m --delete --exclude '*.v2' --exclude training.log \
      "../models/$data-$treebank/" "$treebank-$data-$date.model"
  fi
done

# For every treebank named in the first tab-separated column of
# ../$data/langs_sizes (entries ending in _all are skipped), copy its
# tokenizer model into <treebank>-<data>-<date>.model/ and make sure that
# directory contains consistent_feats.table.
#
# The command substitution is deliberately unquoted: every
# whitespace-separated word of the cut output is one treebank name.
for treebank in $(cut -f1 "../$data/langs_sizes"); do
  case $treebank in *_all) continue ;; esac

  model_dir=$treebank-$data-$date.model

  # Plain assignment: the leading tilde is expanded and the result is not
  # subject to field splitting or globbing, so no quotes are needed here.
  tokenizer_src=~/repos/udpipe/training/models-$data-tokenizer-chosen/$treebank/$treebank.model
  cp "$tokenizer_src" "$model_dir/$treebank.tokenizer"

  # Generate the table only when it is not already present. The file name
  # must be tested exactly; any extra character inside the quotes makes
  # the check fail and forces a regeneration on every run.
  consistent_feats=$model_dir/consistent_feats.table
  [ -f "$consistent_feats" ] ||
    python3 ../scripts/gen_consistent_feats_tables.py "${treebank%%_*}" "$model_dir"
done