DerivedFunction1 committed on
Commit
163392a
·
verified ·
1 Parent(s): 78e91e0

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +116 -2
README.md CHANGED
@@ -4,17 +4,131 @@ license: mit
4
  base_model: xlm-roberta-base
5
  tags:
6
  - generated_from_trainer
 
7
  metrics:
8
  - precision
9
  - recall
10
  - f1
11
  - accuracy
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
12
  model-index:
13
- - name: xlmr-language-identification
14
  results: []
 
 
 
 
 
 
 
 
 
15
  ---
16
 
17
-
18
  # Polyglot Tagger: Multi-label Language Identification
19
 
20
  This model is trained on the same dataset as `polyglot-tagger/language-identification`, but as a text classifier rather than a token classifier. Refer to that model's card for details.
 
4
  base_model: xlm-roberta-base
5
  tags:
6
  - generated_from_trainer
7
+ - language-identification
8
  metrics:
9
  - precision
10
  - recall
11
  - f1
12
  - accuracy
13
+ language:
14
+ - multilingual
15
+ - af
16
+ - am
17
+ - ar
18
+ - as
19
+ - ba
20
+ - be
21
+ - bg
22
+ - bn
23
+ - bo
24
+ - br
25
+ - bs
26
+ - ca
27
+ - ce
28
+ - ckb
29
+ - cs
30
+ - cy
31
+ - da
32
+ - de
33
+ - dv
34
+ - el
35
+ - en
36
+ - eo
37
+ - es
38
+ - et
39
+ - eu
40
+ - fa
41
+ - fi
42
+ - fr
43
+ - ga
44
+ - gd
45
+ - gl
46
+ - gu
47
+ - he
48
+ - hi
49
+ - hr
50
+ - hu
51
+ - hy
52
+ - id
53
+ - is
54
+ - it
55
+ - ja
56
+ - jv
57
+ - ka
58
+ - kk
59
+ - km
60
+ - kn
61
+ - ko
62
+ - ku
63
+ - ky
64
+ - la
65
+ - lb
66
+ - lo
67
+ - lt
68
+ - lv
69
+ - mg
70
+ - mk
71
+ - ml
72
+ - mn
73
+ - mr
74
+ - ms
75
+ - mt
76
+ - my
77
+ - ne
78
+ - nl
79
+ - 'no'
80
+ - ny
81
+ - oc
82
+ - om
83
+ - or
84
+ - pa
85
+ - pl
86
+ - ps
87
+ - pt
88
+ - rm
89
+ - ro
90
+ - ru
91
+ - sd
92
+ - si
93
+ - sk
94
+ - sl
95
+ - so
96
+ - sq
97
+ - sr
98
+ - su
99
+ - sv
100
+ - sw
101
+ - ta
102
+ - te
103
+ - tg
104
+ - th
105
+ - ti
106
+ - tl
107
+ - tr
108
+ - tt
109
+ - ug
110
+ - uk
111
+ - ur
112
+ - uz
113
+ - vi
114
+ - yo
115
+ - yi
116
+ - zh
117
+ - zu
118
  model-index:
119
+ - name: polyglot-tagger
120
  results: []
121
+ datasets:
122
+ - wikimedia/wikipedia
123
+ - HuggingFaceFW/finetranslations
124
+ - google/smol
125
+ - polyglot-tagger/nlp-noise-snippets
126
+ - polyglot-tagger/wikipedia-language-snippets-filtered
127
+ - polyglot-tagger/finetranslations-filtered
128
+ - polyglot-tagger/tatoeba-filtered
129
+ pipeline_tag: text-classification
130
  ---
131
 
 
132
  # Polyglot Tagger: Multi-label Language Identification
133
 
134
  This model is trained on the same dataset as `polyglot-tagger/language-identification`, but as a text classifier rather than a token classifier. Refer to that model's card for details.