File size: 660 Bytes
ee0ec3d
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
#!/bin/sh
#
# Report which treebanks lack XPOS, UFeats or Lemmas annotation.
#
# Usage: <script> datadir
#
# For every directory ../<datadir>/<treebank>/ (directories whose name ends in
# "_all" are skipped) the file <treebank>-ud-test.conllu is scanned, and one
# line "<dir>: no <column>" is written to stdout for each of the columns
# XPOS (field 5), UFeats (field 6) and Lemmas (field 3) that carries no
# information, i.e. whose value is identical on every token line.
#
# Exit status: 1 when the datadir argument is missing, 0 otherwise.

[ $# -ge 1 ] || { echo "Usage $0 datadir" >&2; exit 1; }
data="$1"; shift

# Print the name of every annotation column that never varies in the
# CoNLL-U file $1, one name per line, in the order XPOS, UFeats, Lemmas.
# Only token lines (an integer ID followed by a tab) are inspected, so
# comments, multiword-token ranges and empty nodes are ignored.
# A file without any token line reports all three columns.
missing_columns() {
  awk -F'\t' '
    /^[0-9]+\t/ {
      # Appending "" forces string comparison; otherwise awk would treat
      # numeric-looking fields such as "1" and "01" as equal.
      lemma = $3 ""; xpos = $5 ""; feats = $6 ""
      if (seen++) {
        if (lemma != first_lemma) lemmas_vary = 1
        if (xpos  != first_xpos)  xpos_varies = 1
        if (feats != first_feats) feats_vary  = 1
      } else {
        first_lemma = lemma; first_xpos = xpos; first_feats = feats
      }
    }
    END {
      if (!xpos_varies) print "XPOS"
      if (!feats_vary)  print "UFeats"
      if (!lemmas_vary) print "Lemmas"
    }
  ' < "$1"
}

for d in "../$data"/*/; do
  # An unmatched glob is left as the literal pattern; skip it.
  [ -d "$d" ] || continue

  case $d in
    *_all/) continue ;;
  esac

  # Treebank name = last path component of the directory.
  name=${d%/}
  name=${name##*/}
  conllu="${d}${name}-ud-test.conllu"

  # Without this guard a missing test file would be reported as lacking
  # all three columns.
  if [ ! -r "$conllu" ]; then
    echo "$d: cannot read $conllu" >&2
    continue
  fi

  # The pipeline always ends with status 0, so the script no longer exits
  # non-zero merely because the last treebank has all columns.
  missing_columns "$conllu" | while IFS= read -r column; do
    printf '%s: no %s\n' "$d" "$column"
  done
done