Added new model trained on 60 epochs

Browse files

Files changed (13) hide show

README.md +9 -6
wav2vec2-large-xlsr-greek/checkpoint-18400/config.json → config.json +0 -0
wav2vec2-large-xlsr-greek/checkpoint-18400/preprocessor_config.json → preprocessor_config.json +0 -0
wav2vec2-large-xlsr-greek/checkpoint-18400/pytorch_model.bin → pytorch_model.bin +0 -0
wav2vec2-large-xlsr-greek/special_tokens_map.json → special_tokens_map.json +0 -0
wav2vec2-large-xlsr-greek/tokenizer_config.json → tokenizer_config.json +0 -0
wav2vec2-large-xlsr-greek/checkpoint-18400/trainer_state.json → trainer_state.json +0 -0
wav2vec2-large-xlsr-greek/checkpoint-18400/training_args.bin → training_args.bin +0 -0
vocab.json +1 -1
wav2vec2-large-xlsr-greek/checkpoint-18400/optimizer.pt +0 -3
wav2vec2-large-xlsr-greek/checkpoint-18400/scheduler.pt +0 -3
wav2vec2-large-xlsr-greek/preprocessor_config.json +0 -8
wav2vec2-large-xlsr-greek/vocab.json +0 -1

README.md CHANGED Viewed

@@ -1,12 +1,13 @@
 ---
-language:
-- el
 tags:
-- pytorch
-- ASR
 ---
 # Greek (el) version of the XLSR-Wav2Vec2 automatic speech recognition (ASR) model
@@ -28,6 +29,8 @@ This model was trained on Greek CommonVoice speech data (364MB) for 30 epochs on
 ### How to use for inference:
 Instructions to test on CommonVoice extracts are provided in the ASR_Inference.ipynb. Snippet also available below:
 ```

 ---
+language: el
+datasets:
+- common_voice
 tags:
+- speech
+- audio
+- automatic-speech-recognition
+license: apache-2.0
 ---
 # Greek (el) version of the XLSR-Wav2Vec2 automatic speech recognition (ASR) model
 ### How to use for inference:
+For live demo, make sure that speech files are sampled at 16kHz.
 Instructions to test on CommonVoice extracts are provided in the ASR_Inference.ipynb. Snippet also available below:
 ```

wav2vec2-large-xlsr-greek/checkpoint-18400/config.json → config.json RENAMED Viewed

File without changes

wav2vec2-large-xlsr-greek/checkpoint-18400/preprocessor_config.json → preprocessor_config.json RENAMED Viewed

File without changes

wav2vec2-large-xlsr-greek/checkpoint-18400/pytorch_model.bin → pytorch_model.bin RENAMED Viewed

File without changes

wav2vec2-large-xlsr-greek/special_tokens_map.json → special_tokens_map.json RENAMED Viewed

File without changes

wav2vec2-large-xlsr-greek/tokenizer_config.json → tokenizer_config.json RENAMED Viewed

File without changes

wav2vec2-large-xlsr-greek/checkpoint-18400/trainer_state.json → trainer_state.json RENAMED Viewed

File without changes

wav2vec2-large-xlsr-greek/checkpoint-18400/training_args.bin → training_args.bin RENAMED Viewed

File without changes

vocab.json CHANGED Viewed

@@ -1 +1 @@

- {"~~\u03c8~~": 0, "~~\u03bc~~": 1, "~~\u03c3~~": 2, "~~\u00b4~~": 3, "~~\u0301~~": 4, "v": 6, "~~\u03ad~~": 7, "~~\u03ac~~": 8, "~~\u03ba~~": 9, "~~\u03c5~~": 10, "~~\u03b3~~": 11, "~~\u03b7~~": 12, "~~\u03c7~~": 13, "~~\u03be~~": 14, "m": 15, "~~\u00bb~~": 16, "~~\u03b2~~": 17, "'": 18, "~~\u03b5~~": 19, "~~\u03c6~~": 20, "~~\u03b6~~": 21, "~~\u03b1~~": 22, "~~\u03ae~~": ~~23, "\u03c2":~~ 24, "~~\u2019~~": 25, "~~\u03bf~~": 26, "~~\u03cd~~": 27, "~~\u03b9~~": 28, "~~\u03c9~~": 29, "g": 30, "h": 31, "~~\u00ab~~": 32, "~~\u03cb~~": 33, "~~\u03bb~~": 34, "r": 35, "~~\u03af~~": 36, "~~\u03ca~~": 37, "~~\u03b4~~": 38, "~~\u0390~~": 39, "a": 40, "~~\u03c0~~": 41, "~~\u03c4~~": 42, "e": 43, "o": 44, "n": 45, "~~\u03b8~~": 46, "~~\u03ce~~": 47, "~~\u03c1~~": 48, "~~\u03cc~~": 49, "~~\u03bd~~": 50, "|": 5, "[UNK]": 51, "[PAD]": 52}

+ {"ώ": 0, "γ": 1, "n": 2, "ϋ": 3, "κ": 4, "e": 5, "ξ": 6, "'": 7, "θ": 8, "’": 9, "σ": 10, "η": 11, "ι": 12, "α": 13, "ε": 14, "υ": 15, "v": 16, "μ": 17, "ο": 18, "«": 19, "»": 20, "έ": 21, "ν": 22, "ά": 24, "o": 25, "ζ": 26, "β": 27, "τ": 28, "π": 29, "ή": 30, "ψ": 31, "ΐ": 32, "ό": 33, "h": 34, "ύ": 35, "ω": 36, "´": 37, "χ": 38, "ϊ": 39, "ρ": 40, "a": 41, "ς": 42, "r": 43, "g": 44, "m": 45, "λ": 46, "́": 47, "ί": 48, "φ": 49, "δ": 50, "|": 23, "[UNK]": 51, "[PAD]": 52}

wav2vec2-large-xlsr-greek/checkpoint-18400/optimizer.pt DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:272a2cd55e47d89c16aadfc21a5186b3c1ee4f0dd61f67d1dfbe6e325392f208
-size 2490511751

wav2vec2-large-xlsr-greek/checkpoint-18400/scheduler.pt DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:191d69c70a4b492d24ee1d59dad04edf9839c09a08b9cc6bd41530cfdaa0092c
-size 623

wav2vec2-large-xlsr-greek/preprocessor_config.json DELETED Viewed

@@ -1,8 +0,0 @@
-{
-  "do_normalize": true,
-  "feature_size": 1,
-  "padding_side": "right",
-  "padding_value": 0.0,
-  "return_attention_mask": true,
-  "sampling_rate": 16000
-}

wav2vec2-large-xlsr-greek/vocab.json DELETED Viewed

@@ -1 +0,0 @@

- {"ώ": 0, "γ": 1, "n": 2, "ϋ": 3, "κ": 4, "e": 5, "ξ": 6, "'": 7, "θ": 8, "’": 9, "σ": 10, "η": 11, "ι": 12, "α": 13, "ε": 14, "υ": 15, "v": 16, "μ": 17, "ο": 18, "«": 19, "»": 20, "έ": 21, "ν": 22, "ά": 24, "o": 25, "ζ": 26, "β": 27, "τ": 28, "π": 29, "ή": 30, "ψ": 31, "ΐ": 32, "ό": 33, "h": 34, "ύ": 35, "ω": 36, "´": 37, "χ": 38, "ϊ": 39, "ρ": 40, "a": 41, "ς": 42, "r": 43, "g": 44, "m": 45, "λ": 46, "́": 47, "ί": 48, "φ": 49, "δ": 50, "|": 23, "[UNK]": 51, "[PAD]": 52}