Dandan0K committed on
Commit
45fa43e
1 Parent(s): 9937232

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -1,35 +1,27 @@
1
  *.7z filter=lfs diff=lfs merge=lfs -text
2
  *.arrow filter=lfs diff=lfs merge=lfs -text
3
  *.bin filter=lfs diff=lfs merge=lfs -text
 
4
  *.bz2 filter=lfs diff=lfs merge=lfs -text
5
- *.ckpt filter=lfs diff=lfs merge=lfs -text
6
  *.ftz filter=lfs diff=lfs merge=lfs -text
7
  *.gz filter=lfs diff=lfs merge=lfs -text
8
  *.h5 filter=lfs diff=lfs merge=lfs -text
9
  *.joblib filter=lfs diff=lfs merge=lfs -text
10
  *.lfs.* filter=lfs diff=lfs merge=lfs -text
11
- *.mlmodel filter=lfs diff=lfs merge=lfs -text
12
  *.model filter=lfs diff=lfs merge=lfs -text
13
  *.msgpack filter=lfs diff=lfs merge=lfs -text
14
- *.npy filter=lfs diff=lfs merge=lfs -text
15
- *.npz filter=lfs diff=lfs merge=lfs -text
16
  *.onnx filter=lfs diff=lfs merge=lfs -text
17
  *.ot filter=lfs diff=lfs merge=lfs -text
18
  *.parquet filter=lfs diff=lfs merge=lfs -text
19
  *.pb filter=lfs diff=lfs merge=lfs -text
20
- *.pickle filter=lfs diff=lfs merge=lfs -text
21
- *.pkl filter=lfs diff=lfs merge=lfs -text
22
  *.pt filter=lfs diff=lfs merge=lfs -text
23
  *.pth filter=lfs diff=lfs merge=lfs -text
24
  *.rar filter=lfs diff=lfs merge=lfs -text
25
- *.safetensors filter=lfs diff=lfs merge=lfs -text
26
- saved_model/**/* filter=lfs diff=lfs merge=lfs -text
27
  *.tar.* filter=lfs diff=lfs merge=lfs -text
28
- *.tar filter=lfs diff=lfs merge=lfs -text
29
  *.tflite filter=lfs diff=lfs merge=lfs -text
30
  *.tgz filter=lfs diff=lfs merge=lfs -text
31
- *.wasm filter=lfs diff=lfs merge=lfs -text
32
  *.xz filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
- *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
1
  *.7z filter=lfs diff=lfs merge=lfs -text
2
  *.arrow filter=lfs diff=lfs merge=lfs -text
3
  *.bin filter=lfs diff=lfs merge=lfs -text
4
+ *.bin.* filter=lfs diff=lfs merge=lfs -text
5
  *.bz2 filter=lfs diff=lfs merge=lfs -text
 
6
  *.ftz filter=lfs diff=lfs merge=lfs -text
7
  *.gz filter=lfs diff=lfs merge=lfs -text
8
  *.h5 filter=lfs diff=lfs merge=lfs -text
9
  *.joblib filter=lfs diff=lfs merge=lfs -text
10
  *.lfs.* filter=lfs diff=lfs merge=lfs -text
 
11
  *.model filter=lfs diff=lfs merge=lfs -text
12
  *.msgpack filter=lfs diff=lfs merge=lfs -text
 
 
13
  *.onnx filter=lfs diff=lfs merge=lfs -text
14
  *.ot filter=lfs diff=lfs merge=lfs -text
15
  *.parquet filter=lfs diff=lfs merge=lfs -text
16
  *.pb filter=lfs diff=lfs merge=lfs -text
 
 
17
  *.pt filter=lfs diff=lfs merge=lfs -text
18
  *.pth filter=lfs diff=lfs merge=lfs -text
19
  *.rar filter=lfs diff=lfs merge=lfs -text
20
+ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 
21
  *.tar.* filter=lfs diff=lfs merge=lfs -text
 
22
  *.tflite filter=lfs diff=lfs merge=lfs -text
23
  *.tgz filter=lfs diff=lfs merge=lfs -text
 
24
  *.xz filter=lfs diff=lfs merge=lfs -text
25
  *.zip filter=lfs diff=lfs merge=lfs -text
26
+ *.zstandard filter=lfs diff=lfs merge=lfs -text
27
  *tfevents* filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,148 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ language:
3
+ - fr
4
+ license: apache-2.0
5
+ tags:
6
+ - automatic-speech-recognition
7
+ - fr
8
+ - hf-asr-leaderboard
9
+ - mozilla-foundation/common_voice_8_0
10
+ - robust-speech-event
11
+ datasets:
12
+ - mozilla-foundation/common_voice_8_0
13
+ model-index:
14
+ - name: XLS-R Wav2Vec2 French by Jonatas Grosman
15
+ results:
16
+ - task:
17
+ name: Automatic Speech Recognition
18
+ type: automatic-speech-recognition
19
+ dataset:
20
+ name: Common Voice 8
21
+ type: mozilla-foundation/common_voice_8_0
22
+ args: fr
23
+ metrics:
24
+ - name: Test WER
25
+ type: wer
26
+ value: 16.85
27
+ - name: Test CER
28
+ type: cer
29
+ value: 4.66
30
+ - name: Test WER (+LM)
31
+ type: wer
32
+ value: 16.32
33
+ - name: Test CER (+LM)
34
+ type: cer
35
+ value: 4.21
36
+ - task:
37
+ name: Automatic Speech Recognition
38
+ type: automatic-speech-recognition
39
+ dataset:
40
+ name: Robust Speech Event - Dev Data
41
+ type: speech-recognition-community-v2/dev_data
42
+ args: fr
43
+ metrics:
44
+ - name: Dev WER
45
+ type: wer
46
+ value: 22.34
47
+ - name: Dev CER
48
+ type: cer
49
+ value: 9.88
50
+ - name: Dev WER (+LM)
51
+ type: wer
52
+ value: 17.16
53
+ - name: Dev CER (+LM)
54
+ type: cer
55
+ value: 9.38
56
+ - task:
57
+ name: Automatic Speech Recognition
58
+ type: automatic-speech-recognition
59
+ dataset:
60
+ name: Robust Speech Event - Test Data
61
+ type: speech-recognition-community-v2/eval_data
62
+ args: fr
63
+ metrics:
64
+ - name: Test WER
65
+ type: wer
66
+ value: 19.15
67
+ ---
68
+
69
+ # Fine-tuned XLS-R 1B model for speech recognition in French
70
+
71
+ Fine-tuned [facebook/wav2vec2-xls-r-1b](https://huggingface.co/facebook/wav2vec2-xls-r-1b) on French using the train and validation splits of [Common Voice 8.0](https://huggingface.co/datasets/mozilla-foundation/common_voice_8_0), [MediaSpeech](https://www.openslr.org/108/), [Multilingual TEDx](http://www.openslr.org/100), [Multilingual LibriSpeech](https://www.openslr.org/94/), and [Voxpopuli](https://github.com/facebookresearch/voxpopuli).
72
+ When using this model, make sure that your speech input is sampled at 16kHz.
73
+
74
+ This model was fine-tuned with the [HuggingSound](https://github.com/jonatasgrosman/huggingsound) tool, thanks to the GPU credits generously provided by [OVHcloud](https://www.ovhcloud.com/en/public-cloud/ai-training/) :)
75
+
76
+ ## Usage
77
+
78
+ Using the [HuggingSound](https://github.com/jonatasgrosman/huggingsound) library:
79
+
80
+ ```python
81
+ from huggingsound import SpeechRecognitionModel
82
+
83
+ model = SpeechRecognitionModel("jonatasgrosman/wav2vec2-xls-r-1b-french")
84
+ audio_paths = ["/path/to/file.mp3", "/path/to/another_file.wav"]
85
+
86
+ transcriptions = model.transcribe(audio_paths)
87
+ ```
88
+
89
+ Writing your own inference script:
90
+
91
+ ```python
92
+ import torch
93
+ import librosa
94
+ from datasets import load_dataset
95
+ from transformers import Wav2Vec2ForCTC, Wav2Vec2Processor
96
+
97
+ LANG_ID = "fr"
98
+ MODEL_ID = "jonatasgrosman/wav2vec2-xls-r-1b-french"
99
+ SAMPLES = 10
100
+
101
+ test_dataset = load_dataset("common_voice", LANG_ID, split=f"test[:{SAMPLES}]")
102
+
103
+ processor = Wav2Vec2Processor.from_pretrained(MODEL_ID)
104
+ model = Wav2Vec2ForCTC.from_pretrained(MODEL_ID)
105
+
106
+ # Preprocessing the datasets.
107
+ # We need to read the audio files as arrays
108
+ def speech_file_to_array_fn(batch):
109
+ speech_array, sampling_rate = librosa.load(batch["path"], sr=16_000)
110
+ batch["speech"] = speech_array
111
+ batch["sentence"] = batch["sentence"].upper()
112
+ return batch
113
+
114
+ test_dataset = test_dataset.map(speech_file_to_array_fn)
115
+ inputs = processor(test_dataset["speech"], sampling_rate=16_000, return_tensors="pt", padding=True)
116
+
117
+ with torch.no_grad():
118
+ logits = model(inputs.input_values, attention_mask=inputs.attention_mask).logits
119
+
120
+ predicted_ids = torch.argmax(logits, dim=-1)
121
+ predicted_sentences = processor.batch_decode(predicted_ids)
122
+ ```
123
+
124
+ ## Evaluation Commands
125
+
126
+ 1. To evaluate on `mozilla-foundation/common_voice_8_0` with split `test`
127
+
128
+ ```bash
129
+ python eval.py --model_id jonatasgrosman/wav2vec2-xls-r-1b-french --dataset mozilla-foundation/common_voice_8_0 --config fr --split test
130
+ ```
131
+
132
+ 2. To evaluate on `speech-recognition-community-v2/dev_data`
133
+
134
+ ```bash
135
+ python eval.py --model_id jonatasgrosman/wav2vec2-xls-r-1b-french --dataset speech-recognition-community-v2/dev_data --config fr --split validation --chunk_length_s 5.0 --stride_length_s 1.0
136
+ ```
137
+
138
+ ## Citation
139
+ If you want to cite this model you can use this:
140
+
141
+ ```bibtex
142
+ @misc{grosman2021xlsr-1b-french,
143
+ title={Fine-tuned {XLS-R} 1{B} model for speech recognition in {F}rench},
144
+ author={Grosman, Jonatas},
145
+ howpublished={\url{https://huggingface.co/jonatasgrosman/wav2vec2-xls-r-1b-french}},
146
+ year={2022}
147
+ }
148
+ ```
alphabet.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"labels": ["", "<s>", "</s>", "\u2047", " ", "'", "-", "a", "b", "c", "d", "e", "f", "g", "h", "i", "j", "k", "l", "m", "n", "o", "p", "q", "r", "s", "t", "u", "v", "w", "x", "y", "z", "\u00e0", "\u00e2", "\u00e3", "\u00e7", "\u00e8", "\u00e9", "\u00ea", "\u00eb", "\u00ee", "\u00ef", "\u00f4", "\u00f9", "\u00fb", "\u0153"], "is_bpe": false}
config.json ADDED
@@ -0,0 +1,107 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "facebook/wav2vec2-xls-r-1b",
3
+ "activation_dropout": 0.05,
4
+ "adapter_kernel_size": 3,
5
+ "adapter_stride": 2,
6
+ "add_adapter": false,
7
+ "apply_spec_augment": true,
8
+ "architectures": [
9
+ "Wav2Vec2ForCTC"
10
+ ],
11
+ "attention_dropout": 0.05,
12
+ "bos_token_id": 1,
13
+ "classifier_proj_size": 256,
14
+ "codevector_dim": 1024,
15
+ "contrastive_logits_temperature": 0.1,
16
+ "conv_bias": true,
17
+ "conv_dim": [
18
+ 512,
19
+ 512,
20
+ 512,
21
+ 512,
22
+ 512,
23
+ 512,
24
+ 512
25
+ ],
26
+ "conv_kernel": [
27
+ 10,
28
+ 3,
29
+ 3,
30
+ 3,
31
+ 3,
32
+ 2,
33
+ 2
34
+ ],
35
+ "conv_stride": [
36
+ 5,
37
+ 2,
38
+ 2,
39
+ 2,
40
+ 2,
41
+ 2,
42
+ 2
43
+ ],
44
+ "ctc_loss_reduction": "mean",
45
+ "ctc_zero_infinity": false,
46
+ "diversity_loss_weight": 0.1,
47
+ "do_stable_layer_norm": true,
48
+ "eos_token_id": 2,
49
+ "feat_extract_activation": "gelu",
50
+ "feat_extract_dropout": 0.0,
51
+ "feat_extract_norm": "layer",
52
+ "feat_proj_dropout": 0.05,
53
+ "feat_quantizer_dropout": 0.0,
54
+ "final_dropout": 0.05,
55
+ "hidden_act": "gelu",
56
+ "hidden_dropout": 0.05,
57
+ "hidden_size": 1280,
58
+ "initializer_range": 0.02,
59
+ "intermediate_size": 5120,
60
+ "layer_norm_eps": 1e-05,
61
+ "layerdrop": 0.05,
62
+ "mask_feature_length": 10,
63
+ "mask_feature_min_masks": 0,
64
+ "mask_feature_prob": 0.0,
65
+ "mask_time_length": 10,
66
+ "mask_time_min_masks": 2,
67
+ "mask_time_prob": 0.05,
68
+ "model_type": "wav2vec2",
69
+ "num_adapter_layers": 3,
70
+ "num_attention_heads": 16,
71
+ "num_codevector_groups": 2,
72
+ "num_codevectors_per_group": 320,
73
+ "num_conv_pos_embedding_groups": 16,
74
+ "num_conv_pos_embeddings": 128,
75
+ "num_feat_extract_layers": 7,
76
+ "num_hidden_layers": 48,
77
+ "num_negatives": 100,
78
+ "output_hidden_size": 1280,
79
+ "pad_token_id": 0,
80
+ "proj_codevector_dim": 1024,
81
+ "tdnn_dilation": [
82
+ 1,
83
+ 2,
84
+ 3,
85
+ 1,
86
+ 1
87
+ ],
88
+ "tdnn_dim": [
89
+ 512,
90
+ 512,
91
+ 512,
92
+ 512,
93
+ 1500
94
+ ],
95
+ "tdnn_kernel": [
96
+ 5,
97
+ 3,
98
+ 3,
99
+ 1,
100
+ 1
101
+ ],
102
+ "torch_dtype": "float32",
103
+ "transformers_version": "4.16.0.dev0",
104
+ "use_weighted_layer_sum": false,
105
+ "vocab_size": 47,
106
+ "xvector_output_dim": 512
107
+ }
eval.py ADDED
@@ -0,0 +1,164 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ #!/usr/bin/env python3
2
+ from datasets import load_dataset, load_metric, Audio, Dataset
3
+ from transformers import pipeline, AutoFeatureExtractor, AutoTokenizer, AutoConfig, AutoModelForCTC, Wav2Vec2Processor, Wav2Vec2ProcessorWithLM
4
+ import re
5
+ import torch
6
+ import argparse
7
+ from typing import Dict
8
+
9
def log_results(result: Dataset, args: argparse.Namespace):
    """Compute WER and CER for the evaluated dataset, print them and write them to disk.

    The metric computation itself is intentionally left untouched so that
    scores stay comparable; only the output handling differs from the
    original template.

    Args:
        result: Dataset exposing string columns ``"prediction"`` and ``"target"``.
        args: Parsed command-line arguments. Reads ``dataset``, ``config``,
            ``split`` and ``log_outputs``.

    Side effects:
        Writes ``<dataset_id>_eval_results.txt`` and, when ``args.log_outputs``
        is truthy, ``log_<dataset_id>_predictions.txt`` and
        ``log_<dataset_id>_targets.txt`` in the current working directory.
    """
    log_outputs = args.log_outputs
    dataset_id = "_".join(args.dataset.split("/") + [args.config, args.split])

    # load metric
    wer = load_metric("wer")
    cer = load_metric("cer")

    # compute metrics
    wer_result = wer.compute(references=result["target"], predictions=result["prediction"])
    cer_result = cer.compute(references=result["target"], predictions=result["prediction"])

    # print & log results
    result_str = (
        f"WER: {wer_result}\n"
        f"CER: {cer_result}"
    )
    print(result_str)

    # Explicit UTF-8: the platform default encoding may not be UTF-8.
    with open(f"{dataset_id}_eval_results.txt", "w", encoding="utf-8") as f:
        f.write(result_str)

    # log all results in text file. Possibly interesting for analysis.
    # `--log_outputs` is a store_true flag, so it is a bool and never None;
    # test its truthiness instead of `is not None` (which was always true).
    if log_outputs:
        pred_file = f"log_{dataset_id}_predictions.txt"
        target_file = f"log_{dataset_id}_targets.txt"

        # Transcripts contain accented characters, so force UTF-8 here too.
        with open(pred_file, "w", encoding="utf-8") as p, open(target_file, "w", encoding="utf-8") as t:

            # mapping function to write output; used only for its side effects
            def write_to_file(batch, i):
                p.write(f"{i}" + "\n")
                p.write(batch["prediction"] + "\n")
                t.write(f"{i}" + "\n")
                t.write(batch["target"] + "\n")

            result.map(write_to_file, with_indices=True)
48
+
49
+
50
def normalize_text(text: str, invalid_chars_regex: str, to_lower: bool) -> str:
    """Normalize a reference transcript before scoring.

    DO ADAPT FOR YOUR USE CASE.

    Steps, in order:
      1. Case-fold the text (lower-case when ``to_lower`` is true, upper-case otherwise).
      2. Replace every match of ``invalid_chars_regex`` with a single space.
      3. Collapse runs of whitespace into one space and strip both ends.

    Args:
        text: Raw target sentence.
        invalid_chars_regex: Regular expression matching the characters to drop.
        to_lower: Selects lower-casing (True) or upper-casing (False).

    Returns:
        The normalized text; may be the empty string.
    """
    text = text.lower() if to_lower else text.upper()

    text = re.sub(invalid_chars_regex, " ", text)

    # Raw string: "\s" in a normal string literal is an invalid escape sequence.
    text = re.sub(r"\s+", " ", text).strip()

    return text
60
+
61
+
62
def main(args):
    """Run the ASR evaluation described by ``args`` and log the metrics.

    Loads the dataset split, builds an automatic-speech-recognition pipeline
    for ``args.model_id`` (with the language-model decoder unless
    ``args.greedy`` is set), transcribes every example, normalizes the
    reference sentences to the model's vocabulary, drops examples whose
    normalized target is empty and hands the result to ``log_results``.

    Args:
        args: Parsed command-line arguments. Reads ``dataset``, ``config``,
            ``split``, ``model_id``, ``greedy``, ``device``,
            ``chunk_length_s`` and ``stride_length_s``. ``args.device`` is
            overwritten in place when it is None.
    """
    # load dataset
    dataset = load_dataset(args.dataset, args.config, split=args.split, use_auth_token=True)

    # for testing: only process the first ten examples as a test
    # dataset = dataset.select(range(10))

    # load processor
    if args.greedy:
        processor = Wav2Vec2Processor.from_pretrained(args.model_id)
        decoder = None
    else:
        processor = Wav2Vec2ProcessorWithLM.from_pretrained(args.model_id)
        decoder = processor.decoder

    feature_extractor = processor.feature_extractor
    tokenizer = processor.tokenizer

    # resample audio
    dataset = dataset.cast_column("audio", Audio(sampling_rate=feature_extractor.sampling_rate))

    # load eval pipeline
    if args.device is None:
        # No explicit device: use the first GPU when CUDA is available, else CPU (-1).
        args.device = 0 if torch.cuda.is_available() else -1

    config = AutoConfig.from_pretrained(args.model_id)
    model = AutoModelForCTC.from_pretrained(args.model_id)

    #asr = pipeline("automatic-speech-recognition", model=args.model_id, device=args.device)
    asr = pipeline("automatic-speech-recognition", config=config, model=model, tokenizer=tokenizer,
                   feature_extractor=feature_extractor, decoder=decoder, device=args.device)

    # build normalizer config
    tokenizer = AutoTokenizer.from_pretrained(args.model_id)
    tokens = tokenizer.convert_ids_to_tokens(range(0, tokenizer.vocab_size))
    special_tokens = [
        tokenizer.pad_token, tokenizer.word_delimiter_token,
        tokenizer.unk_token, tokenizer.bos_token,
        tokenizer.eos_token,
    ]
    non_special_tokens = [x for x in tokens if x not in special_tokens]
    # Raw f-string: "\s" in a normal string literal is an invalid escape sequence.
    # The resulting pattern matches anything that is neither whitespace nor a vocabulary character.
    invalid_chars_regex = rf"[^\s{re.escape(''.join(set(non_special_tokens)))}]"
    # Lower-case the targets if the vocabulary contains any lower-case alphabetic token,
    # otherwise upper-case them.
    normalize_to_lower = any(token.isalpha() and token.islower() for token in non_special_tokens)

    # map function to decode audio
    def map_to_pred(batch, args=args, asr=asr, invalid_chars_regex=invalid_chars_regex, normalize_to_lower=normalize_to_lower):
        prediction = asr(batch["audio"]["array"], chunk_length_s=args.chunk_length_s, stride_length_s=args.stride_length_s)

        batch["prediction"] = prediction["text"]
        batch["target"] = normalize_text(batch["sentence"], invalid_chars_regex, normalize_to_lower)
        return batch

    # run inference on all examples
    result = dataset.map(map_to_pred, remove_columns=dataset.column_names)

    # filtering out empty targets
    result = result.filter(lambda example: example["target"] != "")

    # compute and log_results
    # do not change function below
    log_results(result, args)
127
+
128
+
129
if __name__ == "__main__":
    # Command-line entry point: parse the evaluation options and run `main`.
    parser = argparse.ArgumentParser()

    parser.add_argument(
        "--model_id", type=str, required=True, help="Model identifier. Should be loadable with 🤗 Transformers"
    )
    parser.add_argument(
        "--dataset", type=str, required=True, help="Dataset name to evaluate the `model_id`. Should be loadable with 🤗 Datasets"
    )
    parser.add_argument(
        "--config", type=str, required=True, help="Config of the dataset. *E.g.* `'en'` for Common Voice"
    )
    parser.add_argument(
        "--split", type=str, required=True, help="Split of the dataset. *E.g.* `'test'`"
    )
    parser.add_argument(
        "--chunk_length_s", type=float, default=None, help="Chunk length in seconds. Defaults to None. For long audio files a good value would be 5.0 seconds."
    )
    parser.add_argument(
        "--stride_length_s", type=float, default=None, help="Stride of the audio chunks. Defaults to None. For long audio files a good value would be 1.0 seconds."
    )
    parser.add_argument(
        "--log_outputs", action='store_true', help="If defined, write outputs to log file for analysis."
    )
    parser.add_argument(
        "--greedy", action='store_true', help="If defined, the LM will be ignored during inference."
    )
    parser.add_argument(
        "--device",
        type=int,
        default=None,
        # The default is None, which `main` resolves to GPU 0 when CUDA is
        # available and to CPU otherwise, so CPU is not the unconditional default.
        help="The device to run the pipeline on. -1 for CPU, 0 for the first GPU and so on. "
             "If omitted, the first GPU is used when CUDA is available, otherwise CPU.",
    )
    args = parser.parse_args()

    main(args)
full_eval.sh ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
# Runs the greedy and LM-boosted evaluations on both benchmark datasets.
# Each greedy run writes to the same file names as the LM run, so its outputs
# are renamed with a `_greedy` suffix before the LM run overwrites them.

# Stop at the first failure: otherwise a failed eval would be followed by `mv`
# commands that may rename stale files from an earlier run.
set -eu

MODEL_ID="jonatasgrosman/wav2vec2-xls-r-1b-french"

# CV 8 - TEST

python eval.py --model_id "$MODEL_ID" --dataset mozilla-foundation/common_voice_8_0 --config fr --split test --log_outputs --greedy
mv log_mozilla-foundation_common_voice_8_0_fr_test_predictions.txt log_mozilla-foundation_common_voice_8_0_fr_test_predictions_greedy.txt
mv mozilla-foundation_common_voice_8_0_fr_test_eval_results.txt mozilla-foundation_common_voice_8_0_fr_test_eval_results_greedy.txt

python eval.py --model_id "$MODEL_ID" --dataset mozilla-foundation/common_voice_8_0 --config fr --split test --log_outputs

# HF EVENT - DEV

python eval.py --model_id "$MODEL_ID" --dataset speech-recognition-community-v2/dev_data --config fr --split validation --chunk_length_s 5.0 --stride_length_s 1.0 --log_outputs --greedy
mv log_speech-recognition-community-v2_dev_data_fr_validation_predictions.txt log_speech-recognition-community-v2_dev_data_fr_validation_predictions_greedy.txt
mv speech-recognition-community-v2_dev_data_fr_validation_eval_results.txt speech-recognition-community-v2_dev_data_fr_validation_eval_results_greedy.txt

python eval.py --model_id "$MODEL_ID" --dataset speech-recognition-community-v2/dev_data --config fr --split validation --chunk_length_s 5.0 --stride_length_s 1.0 --log_outputs
language_model/attrs.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"alpha": 0.5, "beta": 1.5, "unk_score_offset": -10.0, "score_boundary": true}
language_model/lm.binary ADDED
Binary file (180 kB). View file
 
language_model/unigrams.txt ADDED
@@ -0,0 +1,2630 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ (adult_support
2
+ </s>
3
+ <s>
4
+ a
5
+ achètre
6
+ acuillère
7
+ adul
8
+ adult
9
+ agil
10
+ agilé
11
+ aie
12
+ aigui
13
+ aiguière
14
+ aimelle
15
+ air
16
+ ajaje
17
+ ak
18
+ akalada
19
+ akapade
20
+ akaskalade
21
+ akasse
22
+ akateur
23
+ alpaakapade
24
+ alève
25
+ amo
26
+ amour
27
+ amu
28
+ an
29
+ ananaoute
30
+ angalche
31
+ angeu
32
+ angl
33
+ anglache
34
+ anglage
35
+ anglageu
36
+ anglaggue
37
+ anglaye
38
+ anglaze
39
+ anglège
40
+ anglé
41
+ angèle
42
+ anjloge
43
+ anjo
44
+ anklage
45
+ anour
46
+ aou
47
+ aoute
48
+ août
49
+ apapaaparitian
50
+ aparipion
51
+ aparitssion
52
+ aparsion
53
+ aparssion
54
+ apartion
55
+ apartipari
56
+ apartizion
57
+ aparéssion
58
+ aparétion
59
+ aper
60
+ apotion
61
+ appar
62
+ apparition
63
+ appartirssion
64
+ apparédition
65
+ apparéssion
66
+ apparétion
67
+ appozilti
68
+ apprécian
69
+ apprétien
70
+ ar
71
+ arabe
72
+ aragil
73
+ arargil
74
+ arargliaguil
75
+ archchestre
76
+ archestre
77
+ archil
78
+ archéleu
79
+ archétreu
80
+ argile
81
+ argril
82
+ arguil
83
+ arguile
84
+ arguileu
85
+ arguilé
86
+ arkestre
87
+ arkiche
88
+ arré
89
+ aréar
90
+ arégil
91
+ ascalade
92
+ ascalope
93
+ askalope
94
+ asskajope
95
+ atrifle
96
+ azé
97
+
98
+ aéskalopé
99
+ b
100
+ baandi
101
+ babante
102
+ babaskét
103
+ badi
104
+ baie
105
+ baille
106
+ bain
107
+ bainbante
108
+ bainte
109
+ bak
110
+ baké
111
+ bala
112
+ balade
113
+ baladeu
114
+ balai
115
+ balansde
116
+ balante
117
+ balin
118
+ balon
119
+ balé
120
+ ban
121
+ banbandi
122
+ banbantite
123
+ bande
124
+ bandi
125
+ bandit
126
+ bane
127
+ baneur
128
+ banfonge
129
+ banieul
130
+ bannajeu
131
+ bante
132
+ banteu
133
+ baroce
134
+ bask
135
+ baske
136
+ baskede
137
+ basket
138
+ baskette
139
+ baskeuil
140
+ baské
141
+ basse
142
+ bati
143
+ baton
144
+ batte
145
+ baye
146
+ bbréteu
147
+ be
148
+ beberné
149
+ bebeul
150
+ beel
151
+ befagueu
152
+ bei
153
+ beli
154
+ bemurence
155
+ ben
156
+ beneur
157
+ bente
158
+ beui
159
+ beuil
160
+ beureu
161
+ beurné
162
+ beyuil
163
+ beèl
164
+ bien
165
+ biente
166
+ bieu
167
+ bif
168
+ bijelle
169
+ bijo
170
+ bindi
171
+ binfage
172
+ binjo
173
+ binte
174
+ binteu
175
+ biro
176
+ biyo
177
+ bl
178
+ bla
179
+ blanc
180
+ blank
181
+ blé
182
+ bléfassion
183
+ boche
184
+ boi
185
+ boil
186
+ boin
187
+ boire
188
+ bolieu
189
+ bolotte
190
+ bomon
191
+ bon
192
+ bonbente
193
+ bonbonde
194
+ bonbonfage
195
+ bonbonheur
196
+ bonbononeur
197
+ bonbumon
198
+ bonde
199
+ bonebonheur
200
+ boneubonheur
201
+ bonfa
202
+ bonfach
203
+ bonfage
204
+ bonfajeu
205
+ bonheur
206
+ bonheure
207
+ bonjageu
208
+ bonnebunebon
209
+ bonte
210
+ bonteu
211
+ bonté
212
+ bonvage
213
+ bonvaléskence
214
+ borniai
215
+ borté
216
+ bou
217
+ bouette
218
+ boufage
219
+ boufoi
220
+ boulboulan
221
+ boule
222
+ bouleau
223
+ bouleu
224
+ boullo
225
+ boulon
226
+ boulot
227
+ boulotte
228
+ bounheur
229
+ boyl
230
+ boèle
231
+ bra
232
+ bre
233
+ breu
234
+ breuil
235
+ breuté
236
+ bronbage
237
+ brou
238
+ bru
239
+ brudurence
240
+ brufondulence
241
+ brui
242
+ brume
243
+ brumedurence
244
+ brumeu
245
+ brumibubrumidurence
246
+ brumiderence
247
+ brumidi
248
+ brumidrence
249
+ brumidu
250
+ brumiduren
251
+ brumidurence
252
+ brumidurenceu
253
+ brumidurenze
254
+ brumiduresen
255
+ brumindurence
256
+ brumitrudurement
257
+ brumiturence
258
+ brumudirenk
259
+ brumudurence
260
+ brun
261
+ brune
262
+ brunidurence
263
+ brèbrète
264
+ brème
265
+ brète
266
+ bré
267
+ bu
268
+ bubei
269
+ bubuman
270
+ bubumon
271
+ buchurelle
272
+ bucurelle
273
+ buie
274
+ buil
275
+ bukerelle
276
+ bukrelle
277
+ bukulbukurelle
278
+ bukurle
279
+ bukuré
280
+ bulement
281
+ bulence
282
+ bulié
283
+ buman
284
+ bumisse
285
+ bumo
286
+ bumon
287
+ bun
288
+ buno
289
+ bunon
290
+ burkuresse
291
+ burme
292
+ burugreille
293
+ bururelle
294
+ bute
295
+ buturelle
296
+ bz
297
+
298
+ bète
299
+ béil
300
+ béjér
301
+ bér
302
+ béret
303
+ bérote
304
+ béré
305
+ béské
306
+ béssan
307
+ bézir
308
+ c
309
+ ca
310
+ cable
311
+ cacatastrophe
312
+ cacorpon
313
+ cafté
314
+ cahier
315
+ cala
316
+ calié
317
+ camande
318
+ camar
319
+ cande
320
+ canjo
321
+ car
322
+ cara
323
+ caraféfelle
324
+ caramel
325
+ caraval
326
+ caravaneu
327
+ caraveleu
328
+ caravelle
329
+ caravéveleu
330
+ carcardon
331
+ carcordonne
332
+ cardon
333
+ careu
334
+ carré
335
+ carsotrofeu
336
+ cartaffrofe
337
+ carte
338
+ carton
339
+ cartre
340
+ caré
341
+ cascatastrof
342
+ cascatastrophe
343
+ casier
344
+ caskaderof
345
+ casscazié
346
+ casser
347
+ cassi
348
+ cassier
349
+ cassion
350
+ cassière
351
+ cassié
352
+ casta
353
+ castastrof
354
+ castastrophe
355
+ castatastrophe
356
+ castatrophe
357
+ castor
358
+ castraf
359
+ catastrophe
360
+ catatof
361
+ catisseu
362
+ caval
363
+ cavelle
364
+ cazé
365
+ ccordon
366
+ ccouette
367
+ celcélié
368
+ celier
369
+ celié
370
+ cellier
371
+ celécellié
372
+ cerf
373
+ cerfe
374
+ cerffe
375
+ cerfon
376
+ ceureu
377
+ ch
378
+ cha
379
+ chacaleur
380
+ chal
381
+ chale
382
+ chaleur
383
+ chalo
384
+ chalou
385
+ cham
386
+ chambre
387
+ chambreu
388
+ chamechambre
389
+ champre
390
+ chan
391
+ chanson
392
+ chansson
393
+ chapre
394
+ char
395
+ charré
396
+ chaso
397
+ chasschanson
398
+ chasseu
399
+ chasseur
400
+ chasson
401
+ chausson
402
+ chazon
403
+ chazzon
404
+ chch
405
+ chemichemizié
406
+ cheminchemizier
407
+ chemise
408
+ chemisier
409
+ chemizer
410
+ chemizi
411
+ chemizé
412
+ chemmizer
413
+ chenousière
414
+ chiko
415
+ chjoi
416
+ cho
417
+ choette
418
+ choideu
419
+ choil
420
+ choin
421
+ choinson
422
+ choix
423
+ choizi
424
+ chou
425
+ chouette
426
+ chouetteu
427
+ choute
428
+ choutte
429
+ chouté
430
+ chrève
431
+ chureu
432
+ chègle
433
+ chèr
434
+ chémissié
435
+ chémizié
436
+ ci
437
+ cieux
438
+ cirque
439
+ ciseau
440
+ clcleffe
441
+ clef
442
+ clefe
443
+ cleffe
444
+ cleuffe
445
+ clière
446
+ clèfe
447
+ clèffe
448
+ clécléffe
449
+ cléffe
450
+ co
451
+ cocommande
452
+ coconvcoconvalézzken
453
+ coette
454
+ coeur
455
+ coière
456
+ cojo
457
+ cokette
458
+ colavalassize
459
+ cole
460
+ colère
461
+ comandeu
462
+ comanne
463
+ commande
464
+ commen
465
+ commun
466
+ compagne
467
+ comun
468
+ con
469
+ conbalésense
470
+ confalé
471
+ confffa
472
+ conje
473
+ conjeau
474
+ conjejo
475
+ conjeul
476
+ conjon
477
+ conjé
478
+ conmande
479
+ connande
480
+ connevalésence
481
+ contisse
482
+ contuze
483
+ conval
484
+ convaleksance
485
+ convalensencente
486
+ convalescence
487
+ convalesens
488
+ convalesent
489
+ convalkslence
490
+ convalsence
491
+ convalékense
492
+ convaléksen
493
+ convaléscence
494
+ convalésence
495
+ convalésesence
496
+ convalésesesense
497
+ convaléskens
498
+ convaléssen
499
+ convalésssens
500
+ convaléséan
501
+ conzo
502
+ cor
503
+ corban
504
+ cordon
505
+ coteu
506
+ cotrer
507
+ cou
508
+ coubon
509
+ coucouette
510
+ couette
511
+ coul
512
+ couleur
513
+ couleuvre
514
+ courdon
515
+ courtain
516
+ courtir
517
+ courtié
518
+ cousse
519
+ coussette
520
+ coute
521
+ couète
522
+ coué
523
+ covaleco
524
+ covalésence
525
+ covalésonse
526
+ covasens
527
+ coère
528
+ cr
529
+ cra
530
+ cracrâne
531
+ cracréteu
532
+ craie
533
+ craine
534
+ cran
535
+ crane
536
+ craneu
537
+ cranneu
538
+ crate
539
+ cravalelle
540
+ crayon
541
+ crcrane
542
+ cre
543
+ creute
544
+ creux
545
+ crime
546
+ crin
547
+ crodon
548
+ crok
549
+ crouitien
550
+ crte
551
+ crâne
552
+ crâneu
553
+ crè
554
+ crèfe
555
+ crène
556
+ crèteu
557
+ crève
558
+ cré
559
+ crémè
560
+ crémé
561
+ crépeu
562
+ crérèf
563
+ créssizion
564
+ crétan
565
+ créteu
566
+ créveu
567
+ crêpe
568
+ crête
569
+ cucutisse
570
+ cui
571
+ cuisine
572
+ cuisiner
573
+ cuisinier
574
+ cuisinière
575
+ cuisiné
576
+ cuissetisse
577
+ cuissin
578
+ cuissineu
579
+ cuissinier
580
+ cuisson
581
+ cuizine
582
+ cuiziné
583
+ culeu
584
+ cum
585
+ curelle
586
+ cutice
587
+ cutir
588
+ cutisseu
589
+ cutissse
590
+ cutize
591
+ cutizeu
592
+ cutécutigue
593
+ cuzinié
594
+ cygogne
595
+
596
+ cécé
597
+ célié
598
+ cérf
599
+ cérfe
600
+ d
601
+ da
602
+ daba
603
+ dabe
604
+ dadante
605
+ dafffré
606
+ damadéménagé
607
+ dane
608
+ dante
609
+ davan
610
+ davdafon
611
+ dave
612
+ daveau
613
+ davon
614
+ de
615
+ dedalvo
616
+ dedoufaj
617
+ demain
618
+ deman
619
+ demande
620
+ demander
621
+ demandeu
622
+ demandé
623
+ demindemanagemen
624
+ demonde
625
+ dente
626
+ dessiner
627
+ detonde
628
+ deu
629
+ dev
630
+ devo
631
+ devé
632
+ deère
633
+ di
634
+ diche
635
+ didisse
636
+ dieu
637
+ dieux
638
+ diga
639
+ digace
640
+ digacelle
641
+ digaceuleu
642
+ digacélé
643
+ digacéséle
644
+ digalcèle
645
+ digalselle
646
+ digalèce
647
+ digcèle
648
+ digigo
649
+ diglacelle
650
+ digo
651
+ dij
652
+ dijacelle
653
+ dijaslé
654
+ dijijo
655
+ dik
656
+ dikacelle
657
+ dikacette
658
+ dikakelle
659
+ dimanche
660
+ din
661
+ dinmelle
662
+ dinoi
663
+ dinssion
664
+ dire
665
+ diré
666
+ divan
667
+ diveu
668
+ dix
669
+ diè
670
+ diège
671
+ diègue
672
+ dièrge
673
+ dié
674
+ diége
675
+ diégeu
676
+ diégueu
677
+ diégé
678
+ do
679
+ doi
680
+ doing
681
+ doir
682
+ don
683
+ dondonteu
684
+ dondé
685
+ donedé
686
+ donfage
687
+ donfaje
688
+ donné
689
+ donte
690
+ donté
691
+ doonte
692
+ dote
693
+ doujoute
694
+ doukkreukrèle
695
+ douveu
696
+ dproduikssion
697
+ dralation
698
+ drdrdrdr
699
+ drevo
700
+ drume
701
+ drècrète
702
+ drève
703
+ dréfonette
704
+ du
705
+ duddubute
706
+ dudu
707
+ duf
708
+ duie
709
+ duil
710
+ dukacelle
711
+ dumon
712
+ dupuè
713
+ durlène
714
+ duvduvé
715
+ duve
716
+ duverre
717
+ duvet
718
+ duvette
719
+ duvo
720
+ duvon
721
+ dué
722
+
723
+ débal
724
+ débar
725
+ débarakemen
726
+ débarakmen
727
+ débardemen
728
+ débardement
729
+ débarken
730
+ débarkément
731
+ débarquement
732
+ débéret
733
+ décalartion
734
+ déclar
735
+ déclaration
736
+ déclaratsion
737
+ déclarition
738
+ dédémandéménagé
739
+ défi
740
+ déglindéklarassion
741
+ dékla
742
+ déklaratsion
743
+ déklarssion
744
+ déklassion
745
+ dékrarassion
746
+ délaratio
747
+ déman
748
+ démanageme
749
+ démande
750
+ démangenassionage
751
+ démannagement
752
+ démar
753
+ démarken
754
+ démen
755
+ démengé
756
+ démeunagemen
757
+ démingemen
758
+ démédéménagedéméunnadéménagemen
759
+ déménage
760
+ déménagemen
761
+ déménagement
762
+ déménagerment
763
+ déménajmen
764
+ déménajment
765
+ dép
766
+ dépa
767
+ dépara
768
+ dépardébarquemen
769
+ déparen
770
+ déparkemen
771
+ déparquement
772
+ départdépartemen
773
+ département
774
+ départeur
775
+ départinman
776
+ départtemen
777
+ dérbéré
778
+ déré
779
+ déscala
780
+ désir
781
+ déss
782
+ déssdézir
783
+ déssi
784
+ déssir
785
+ désur
786
+ détarkemen
787
+ détromeb
788
+ dévo
789
+ dézi
790
+ e
791
+ eca
792
+ ekuatèreteur
793
+ ekuiaté
794
+ emposition
795
+ en
796
+ enjlanej
797
+ enkla
798
+ enposition
799
+ eper
800
+ epuji
801
+ equateur
802
+ eruite
803
+ es
804
+ escala
805
+ escalade
806
+ escalader
807
+ escalope
808
+ escalé
809
+ escapade
810
+ escapate
811
+ escar
812
+ escargo
813
+ escargot
814
+ esclaeskalope
815
+ esclave
816
+ escr
817
+ escroc
818
+ escrok
819
+ esescapade
820
+ eseskapade
821
+ eseskorte
822
+ esgabade
823
+ eskabbade
824
+ eskaeskalope
825
+ eskaladeu
826
+ eskalalope
827
+ eskapa
828
+ eskape
829
+ eskarlope
830
+ eskaron
831
+ eski
832
+ eskitassion
833
+ esklapin
834
+ espade
835
+ esscrok
836
+ essitatoine
837
+ estragon
838
+ estrokonkon
839
+ estrumen
840
+ etchateur
841
+ etra
842
+ etsitation
843
+ eu
844
+ eucateur
845
+ euh
846
+ eukateur
847
+ euli
848
+ eum
849
+ euscallope
850
+ euskapade
851
+ euskro
852
+ eustrumain
853
+ ex
854
+ excalope
855
+ excapade
856
+ excitation
857
+ excétation
858
+ existassion
859
+ exkro
860
+ extinteur
861
+ ezalope
862
+ f
863
+ fa
864
+ face
865
+ facile
866
+ fafème
867
+ fage
868
+ faire
869
+ fakade
870
+ fakadé
871
+ faleur
872
+ fameu
873
+ fari
874
+ farine
875
+ farkile
876
+ fass
877
+ fassadeu
878
+ fassate
879
+ fasse
880
+ fassé
881
+ façade
882
+ façadeu
883
+ façadé
884
+ feme
885
+ femme
886
+ fente
887
+ fere
888
+ ferme
889
+ feu
890
+ feufème
891
+ feumeu
892
+ feur
893
+ fezesoeur
894
+ ffar
895
+ ffflinfodireke
896
+ ffisse
897
+ ffossil
898
+ ffréfrère
899
+ ffureur
900
+ ffuzile
901
+ fi
902
+ fidomelle
903
+ fil
904
+ file
905
+ fille
906
+ fils
907
+ filsse
908
+ findre
909
+ fine
910
+ finir
911
+ finit
912
+ finte
913
+ fireu
914
+ fireur
915
+ firo
916
+ firoie
917
+ firoir
918
+ firoireu
919
+ fitivo
920
+ flandobirence
921
+ flanobirence
922
+ flemme
923
+ fleu
924
+ flinbirence
925
+ flinnobirance
926
+ flinobirence
927
+ flisse
928
+ flobirence
929
+ flonobarence
930
+ flonobirence
931
+ flumiflunobirence
932
+ flunobience
933
+ flunobirence
934
+ flunobrience
935
+ flunobrérence
936
+ flunoburence
937
+ flure
938
+ fo
939
+ foché
940
+ fofossile
941
+ fofossé
942
+ foi
943
+ foieutte
944
+ foire
945
+ foireu
946
+ foireux
947
+ foirte
948
+ foiss
949
+ foissil
950
+ foleur
951
+ folisile
952
+ folle
953
+ fon
954
+ fondo
955
+ fonile
956
+ fonobironce
957
+ for
958
+ fore
959
+ forof
960
+ foroi
961
+ foss
962
+ fosse
963
+ fossi
964
+ fossile
965
+ fossileu
966
+ fossé
967
+ fouette
968
+ four
969
+ fourdin
970
+ fozer
971
+ fozé
972
+ frer
973
+ freu
974
+ freuvandulence
975
+ frevoné
976
+ frfoir
977
+ fro
978
+ froduction
979
+ frodukssion
980
+ froi
981
+ frorari
982
+ frumiturence
983
+ frère
984
+ fré
985
+ fréreu
986
+ frésonse
987
+ frézon
988
+ ftui
989
+ fu
990
+ fufuzile
991
+ fufuzzile
992
+ fui
993
+ ful
994
+ funobirence
995
+ fur
996
+ fure
997
+ furefureur
998
+ fureu
999
+ fureur
1000
+ furfureur
1001
+ furi
1002
+ furieu
1003
+ furieur
1004
+ furor
1005
+ fus
1006
+ fusieu
1007
+ fusil
1008
+ fusile
1009
+ fusié
1010
+ fussi
1011
+ fussifussile
1012
+ fussil
1013
+ fussile
1014
+ fuz
1015
+ fuzi
1016
+ fuzil
1017
+ fuzile
1018
+ fvimineminf
1019
+
1020
+ fèbe
1021
+ fèfème
1022
+ fème
1023
+ fène
1024
+ fère
1025
+
1026
+ féfame
1027
+ féime
1028
+ fémeu
1029
+ féreu
1030
+ férmeu
1031
+ férmé
1032
+ févreu
1033
+ g
1034
+ ga
1035
+ gachon
1036
+ gagralassion
1037
+ gaon
1038
+ garcedrape
1039
+ gardon
1040
+ garçon
1041
+ gassiyeu
1042
+ gaz
1043
+ gaçon
1044
+ gelé
1045
+ getère
1046
+ geu
1047
+ gigolle
1048
+ gigot
1049
+ gigote
1050
+ glalaggralassion
1051
+ glalassion
1052
+ glgralassion
1053
+ glope
1054
+ glumon
1055
+ glève
1056
+ goix
1057
+ gordon
1058
+ gou
1059
+ goubrin
1060
+ goudin
1061
+ gour
1062
+ gourdeu
1063
+ gourdien
1064
+ gourdin
1065
+ gourgin
1066
+ gourédin
1067
+ gragarçon
1068
+ grala
1069
+ gralation
1070
+ gralaton
1071
+ gralission
1072
+ grallazton
1073
+ gralonssion
1074
+ gralssion
1075
+ gram
1076
+ grande
1077
+ grane
1078
+ granneu
1079
+ grave
1080
+ grefe
1081
+ greuèl
1082
+ grgarçon
1083
+ grgrègrève
1084
+ griive
1085
+ grise
1086
+ grugroudon
1087
+ grèffe
1088
+ grète
1089
+ grève
1090
+ grèveu
1091
+ gré
1092
+ gréve
1093
+ gréveu
1094
+ gu
1095
+ gua
1096
+ guad
1097
+ gue
1098
+ gugo
1099
+ gui
1100
+ guigguigo
1101
+ guigo
1102
+ guigro
1103
+ guin
1104
+ gumon
1105
+ gustisse
1106
+ gué
1107
+ gélamassion
1108
+ géréal
1109
+ haie
1110
+ hopeur
1111
+ hotel
1112
+ hotèl
1113
+ hotéleu
1114
+ hupeur
1115
+ héteur
1116
+ hôtel
1117
+ i
1118
+ ien
1119
+ imposs
1120
+ impozission
1121
+ incitation
1122
+ info
1123
+ inglacege
1124
+ inglage
1125
+ ininstrumen
1126
+ inite
1127
+ inkateur
1128
+ insstrumen
1129
+ instrugmen
1130
+ instruments
1131
+ instrutmen
1132
+ insézéztararagon
1133
+ intelgence
1134
+ inteli
1135
+ intelihens
1136
+ inteliégegence
1137
+ intelligence
1138
+ intelligente
1139
+ inteuligen
1140
+ intigence
1141
+ intrumen
1142
+ intrument
1143
+ intéintéligence
1144
+ intélience
1145
+ intéligen
1146
+ intéligenz
1147
+ intéligenze
1148
+ intéliyence
1149
+ intéllijen
1150
+ intér
1151
+ intéyi
1152
+ inéksitassion
1153
+ iol
1154
+ iopposisson
1155
+ iscapade
1156
+ ite
1157
+ iège
1158
+ ièiège
1159
+ j
1160
+ ja
1161
+ jadin
1162
+ jajalou
1163
+ jajou
1164
+ jajuin
1165
+ jalon
1166
+ jaloux
1167
+ jamon
1168
+ janvjanvien
1169
+ japin
1170
+ jarbli
1171
+ jardi
1172
+ jardin
1173
+ jari
1174
+ jarjardin
1175
+ jarkanien
1176
+ jarkassion
1177
+ jarkotié
1178
+ jauf
1179
+ je
1180
+ jef
1181
+ jejeul
1182
+ jen
1183
+ jeo
1184
+ jeu
1185
+ jeuf
1186
+ jeul
1187
+ jeur
1188
+ jffuzile
1189
+ ji
1190
+ jido
1191
+ jifcalssel
1192
+ jigo
1193
+ jigotte
1194
+ jijo
1195
+ jin
1196
+ jiroir
1197
+ jiéjièl
1198
+ jje
1199
+ jjoif
1200
+ jjol
1201
+ jjuin
1202
+ jo
1203
+ joeur
1204
+ jof
1205
+ joi
1206
+ joie
1207
+ joif
1208
+ joiyeu
1209
+ jojjeul
1210
+ jokassion
1211
+ jokation
1212
+ jokatssion
1213
+ jol
1214
+ joli
1215
+ jolé
1216
+ jonbark
1217
+ jor
1218
+ joraction
1219
+ jorakassion
1220
+ jorcation
1221
+ jordan
1222
+ jorkarssion
1223
+ jorkazion
1224
+ josse
1225
+ jote
1226
+ joue
1227
+ jouer
1228
+ joujeur
1229
+ jour
1230
+ jourdin
1231
+ joué
1232
+ joveu
1233
+ jozileu
1234
+ joé
1235
+ jtinjo
1236
+ ju
1237
+ juf
1238
+ jui
1239
+ juillette
1240
+ juin
1241
+ juit
1242
+ juite
1243
+ jujuillé
1244
+ jukurelle
1245
+ junu
1246
+ jus
1247
+ jué
1248
+
1249
+ jégal
1250
+ jéjande
1251
+ jérègle
1252
+ jété
1253
+ jéziègue
1254
+ ka
1255
+ kaeskalope
1256
+ kagésson
1257
+ kakakatastrof
1258
+ kaleur
1259
+ kaltié
1260
+ kaskade
1261
+ ke
1262
+ kekoeur
1263
+ keltié
1264
+ kereu
1265
+ kesér
1266
+ keu
1267
+ keureuf
1268
+ kieu
1269
+ kili
1270
+ koi
1271
+ kojo
1272
+ komate
1273
+ koué
1274
+ krcarré
1275
+ ksulisque
1276
+ kuesseu
1277
+ kui
1278
+ kurguel
1279
+ kèrfe
1280
+ kégo
1281
+ kél
1282
+ kélier
1283
+ kélk
1284
+ kér
1285
+ l
1286
+ la
1287
+ ladon
1288
+ lait
1289
+ lalardon
1290
+ lalon
1291
+ lamalédikssion
1292
+ laman
1293
+ lamon
1294
+ lanmon
1295
+ larbo
1296
+ lardo
1297
+ lardon
1298
+ lardron
1299
+ larlarbonne
1300
+ larlardon
1301
+ laver
1302
+ lejejeur
1303
+ lemèce
1304
+ len
1305
+ lenen
1306
+ lenmon
1307
+ li
1308
+ liché
1309
+ lie
1310
+ lieux
1311
+ lije
1312
+ lijo
1313
+ liju
1314
+ likoi
1315
+ liliège
1316
+ lin
1317
+ linjon
1318
+ liojlièjeu
1319
+ lion
1320
+ lir
1321
+ lis
1322
+ lisoi
1323
+ lisoie
1324
+ lisso
1325
+ lissoi
1326
+ lissoie
1327
+ lissoir
1328
+ lissoire
1329
+ livanette
1330
+ live
1331
+ livre
1332
+ lizlizoil
1333
+ lizoille
1334
+ liède
1335
+ liège
1336
+ liègeu
1337
+ lié
1338
+ liégle
1339
+ liéliège
1340
+ llamon
1341
+ lli
1342
+ llizoi
1343
+ llojie
1344
+ llé
1345
+ lo
1346
+ lode
1347
+ lof
1348
+ logis
1349
+ logisse
1350
+ logui
1351
+ loguie
1352
+ loi
1353
+ loif
1354
+ loife
1355
+ loin
1356
+ loir
1357
+ loizlizoi
1358
+ lologie
1359
+ lon
1360
+ loro
1361
+ loti
1362
+ loveu
1363
+ lui
1364
+ luif
1365
+ lumi
1366
+ lumimèce
1367
+ luminesse
1368
+ lumize
1369
+ lumizeu
1370
+ lumièce
1371
+ lumèce
1372
+ lumèke
1373
+ lumère
1374
+ luméke
1375
+ lumémèce
1376
+ lumézeu
1377
+ luni
1378
+ lurlieume
1379
+ lège
1380
+ lèt
1381
+ léande
1382
+ léche
1383
+ légen
1384
+ légende
1385
+ légendeu
1386
+ léginde
1387
+ léguande
1388
+ léguendeu
1389
+ légènede
1390
+ légé
1391
+ léjime
1392
+ léjé
1393
+ léliège
1394
+ léliègue
1395
+ léléssir
1396
+ lémlumèce
1397
+ léssoir
1398
+ m
1399
+ ma
1400
+ mai
1401
+ mail
1402
+ maizon
1403
+ maje
1404
+ malade
1405
+ malin
1406
+ malé
1407
+ malédichian
1408
+ malédicssion
1409
+ malédiction
1410
+ malédission
1411
+ malézik
1412
+ mamamalia
1413
+ mamour
1414
+ man
1415
+ mananivéleu
1416
+ manfelle
1417
+ mani
1418
+ manifé
1419
+ manimanivelle
1420
+ manivele
1421
+ manivelle
1422
+ manon
1423
+ manvielle
1424
+ marabeu
1425
+ mardé
1426
+ marmirabèle
1427
+ matik
1428
+ matin
1429
+ me
1430
+ meil
1431
+ mel
1432
+ memalédiction
1433
+ memeuil
1434
+ mendi
1435
+ menimenizé
1436
+ menizier
1437
+ meniémeil
1438
+ mennuizé
1439
+ menouizié
1440
+ menuiser
1441
+ menuisier
1442
+ menuisié
1443
+ menuisse
1444
+ menuissier
1445
+ menuissière
1446
+ menuizer
1447
+ menuizé
1448
+ menusine
1449
+ menuzier
1450
+ mené
1451
+ meo
1452
+ meu
1453
+ meuble
1454
+ meuil
1455
+ meul
1456
+ meunusier
1457
+ mfa
1458
+ mi
1459
+ michion
1460
+ midéminagemen
1461
+ miel
1462
+ mieu
1463
+ mieuil
1464
+ mieul
1465
+ mijemeu
1466
+ mil
1467
+ mileu
1468
+ mileven
1469
+ milevin
1470
+ milfené
1471
+ milieu
1472
+ mille
1473
+ million
1474
+ milon
1475
+ milvainné
1476
+ milvan
1477
+ milvane
1478
+ milvanné
1479
+ milvavène
1480
+ milven
1481
+ milvenet
1482
+ milvenette
1483
+ milveneu
1484
+ milvenmilvenné
1485
+ milvenné
1486
+ milvenu
1487
+ milvin
1488
+ milvinvène
1489
+ milvéné
1490
+ miléneven
1491
+ mimille
1492
+ mimilvinnette
1493
+ mimiziion
1494
+ mine
1495
+ minion
1496
+ minlémalédikssion
1497
+ minoi
1498
+ minon
1499
+ mion
1500
+ mirabelle
1501
+ mirabeul
1502
+ mirablbelle
1503
+ mirable
1504
+ mirableu
1505
+ miro
1506
+ mission
1507
+ misson
1508
+ mitaple
1509
+ mive
1510
+ miveu
1511
+ miye
1512
+ miyon
1513
+ mizion
1514
+ mizon
1515
+ mié
1516
+ mmaizon
1517
+ mmalédikssion
1518
+ mmenuzié
1519
+ mmeul
1520
+ mmieul
1521
+ mmillion
1522
+ mmmeuil
1523
+ mmméil
1524
+ mmoizon
1525
+ mnaan
1526
+ moi
1527
+ moichon
1528
+ moil
1529
+ moimoisson
1530
+ moireu
1531
+ moiss
1532
+ moission
1533
+ moisson
1534
+ moizin
1535
+ moizon
1536
+ momosson
1537
+ mon
1538
+ mondre
1539
+ monmoisson
1540
+ moti
1541
+ motik
1542
+ motte
1543
+ mou
1544
+ mouelle
1545
+ mouette
1546
+ mouler
1547
+ mounon
1548
+ mouton
1549
+ moutte
1550
+ moutteu
1551
+ mu
1552
+ muette
1553
+ mule
1554
+ mulen
1555
+ mumon
1556
+ munien
1557
+ muno
1558
+ munoi
1559
+ munon
1560
+ munone
1561
+ munou
1562
+ mèive
1563
+
1564
+ méil
1565
+ mék
1566
+ méla
1567
+ méladikssion
1568
+ mélitétion
1569
+ mélivelle
1570
+ mélédiction
1571
+ mémoizon
1572
+ ménuizier
1573
+ ménusier
1574
+ méss
1575
+ méta
1576
+ métal
1577
+ métik
1578
+ mézion
1579
+ mézon
1580
+ n
1581
+ na
1582
+ nadré
1583
+ nadé
1584
+ nanardé
1585
+ nar
1586
+ nardeu
1587
+ nardé
1588
+ narndé
1589
+ naré
1590
+ nave
1591
+ navet
1592
+ navette
1593
+ nif
1594
+ nife
1595
+ ninnoi
1596
+ ninoie
1597
+ ninoir
1598
+ nisoigne
1599
+ nisse
1600
+ nive
1601
+ niveau
1602
+ niveu
1603
+ nivin
1604
+ nivo
1605
+ nivon
1606
+ nièle
1607
+ nmoé
1608
+ nnomembre
1609
+ nobreu
1610
+ noi
1611
+ noir
1612
+ noix
1613
+ nombre
1614
+ nombreu
1615
+ nomi
1616
+ nomouite
1617
+ non
1618
+ norme
1619
+ nou
1620
+ nounombre
1621
+ nouvé
1622
+ nu
1623
+ nuit
1624
+ nunoi
1625
+ nué
1626
+ néta
1627
+ o
1628
+ obsession
1629
+ obsition
1630
+ ocher
1631
+ ochochèstre
1632
+ ochèstretre
1633
+ ocugère
1634
+ ocujé
1635
+ ol
1636
+ olotèl
1637
+ olé
1638
+ on
1639
+ ootel
1640
+ op
1641
+ ope
1642
+ opezission
1643
+ opission
1644
+ oposission
1645
+ oposithion
1646
+ opositive
1647
+ opossission
1648
+ opozission
1649
+ opposilien
1650
+ opposission
1651
+ opposition
1652
+ oppsopeopozission
1653
+ opssion
1654
+ orch
1655
+ orchchestre
1656
+ orchestre
1657
+ orcheur
1658
+ orchtestre
1659
+ orchère
1660
+ orchèstre
1661
+ orchètreu
1662
+ orchéteu
1663
+ orkassion
1664
+ osuk
1665
+ ote
1666
+ oteje
1667
+ otlo
1668
+ oto
1669
+ ototl
1670
+ otél
1671
+ ou
1672
+ ouaoute
1673
+ oug
1674
+ oui
1675
+ oute
1676
+ oué
1677
+ p
1678
+ pa
1679
+ pabble
1680
+ pade
1681
+ padiège
1682
+ padon
1683
+ page
1684
+ pain
1685
+ painte
1686
+ pair
1687
+ pakosso
1688
+ pamon
1689
+ pan
1690
+ panbandi
1691
+ panjo
1692
+ papansson
1693
+ papati
1694
+ papppréné
1695
+ par
1696
+ parace
1697
+ parade
1698
+ paradeu
1699
+ paraparosse
1700
+ parasse
1701
+ parate
1702
+ parcor
1703
+ parcosse
1704
+ parden
1705
+ pardon
1706
+ pare
1707
+ parerosse
1708
+ pari
1709
+ park
1710
+ parkok
1711
+ paroce
1712
+ parodeu
1713
+ parohe
1714
+ parok
1715
+ paron
1716
+ paroparoce
1717
+ paroque
1718
+ parose
1719
+ parosse
1720
+ parosso
1721
+ parparasdeu
1722
+ parrosse
1723
+ parrpa
1724
+ parte
1725
+ partérission
1726
+ paré
1727
+ pasket
1728
+ paské
1729
+ paspaspaské
1730
+ passade
1731
+ passé
1732
+ pate
1733
+ pati
1734
+ patin
1735
+ paton
1736
+ peine
1737
+ peiner
1738
+ pelle
1739
+ pen
1740
+ pendeu
1741
+ pendu
1742
+ penjo
1743
+ pensan
1744
+ pente
1745
+ penteu
1746
+ pentu
1747
+ penté
1748
+ pepompi
1749
+ per
1750
+ perdan
1751
+ perné
1752
+ petite
1753
+ peu
1754
+ peul
1755
+ peureu
1756
+ phème
1757
+ pi
1758
+ pierre
1759
+ pin
1760
+ pince
1761
+ pinceau
1762
+ pinde
1763
+ pineson
1764
+ pinja
1765
+ pinjo
1766
+ pinpinzon
1767
+ pinson
1768
+ pinssan
1769
+ pinsso
1770
+ pinte
1771
+ pinzon
1772
+ pira
1773
+ pireau
1774
+ pirre
1775
+ pisson
1776
+ pizio
1777
+ pièce
1778
+ piège
1779
+ pié
1780
+ piégeu
1781
+ piéjeu
1782
+ piéjé
1783
+ plafassion
1784
+ plaftion
1785
+ plan
1786
+ plank
1787
+ pleur
1788
+ pli
1789
+ plui
1790
+ pluli
1791
+ plumidudrence
1792
+ pléfasson
1793
+ pléfation
1794
+ plépléfakssion
1795
+ plétion
1796
+ po
1797
+ podeu
1798
+ poi
1799
+ poide
1800
+ poids
1801
+ poilleu
1802
+ poin
1803
+ poipoir
1804
+ poir
1805
+ poire
1806
+ poireu
1807
+ pokarelle
1808
+ poliil
1809
+ polo
1810
+ pom
1811
+ pommier
1812
+ pompier
1813
+ pompompié
1814
+ pomé
1815
+ pon
1816
+ ponbi
1817
+ ponceur
1818
+ ponde
1819
+ ponjeur
1820
+ ponjo
1821
+ ponssoimisse
1822
+ ponte
1823
+ popromié
1824
+ poreu
1825
+ porosse
1826
+ porte
1827
+ position
1828
+ pospil
1829
+ potoi
1830
+ pouille
1831
+ poulo
1832
+ poulon
1833
+ pousser
1834
+ pparoke
1835
+ prafoné
1836
+ pre
1837
+ prefassion
1838
+ premié
1839
+ prené
1840
+ prio
1841
+ priro
1842
+ pro
1843
+ produ
1844
+ producteur
1845
+ production
1846
+ produhion
1847
+ produi
1848
+ produiprodukssion
1849
+ produission
1850
+ produitssion
1851
+ produizé
1852
+ produkprodukssion
1853
+ produktsion
1854
+ profil
1855
+ promier
1856
+ protik
1857
+ prprékizion
1858
+ prète
1859
+ pré
1860
+ prébrètze
1861
+ précision
1862
+ prédizion
1863
+ prédé
1864
+ préfassion
1865
+ préfazion
1866
+ préné
1867
+ prépréssizion
1868
+ préreu
1869
+ prés
1870
+ préssion
1871
+ préssision
1872
+ ptil
1873
+ pu
1874
+ pudi
1875
+ pui
1876
+ pukurelle
1877
+ pul
1878
+ puli
1879
+ pului
1880
+ pâté
1881
+ pème
1882
+
1883
+ péme
1884
+ péné
1885
+ péplé
1886
+ pér
1887
+ péreu
1888
+ pérmé
1889
+ pérne
1890
+ pérperné
1891
+ péyerle
1892
+ que
1893
+ quelle
1894
+ r
1895
+ ra
1896
+ radission
1897
+ raie
1898
+ raifeul
1899
+ rajir
1900
+ rajo
1901
+ rak
1902
+ raklème
1903
+ ralassion
1904
+ raperaptil
1905
+ rapide
1906
+ rapleme
1907
+ raplement
1908
+ raplème
1909
+ raplé
1910
+ raplémen
1911
+ rapléraplème
1912
+ rapèl
1913
+ rapèle
1914
+ rarari
1915
+ rari
1916
+ re
1917
+ recolésence
1918
+ reconaissant
1919
+ reconaissation
1920
+ reconession
1921
+ reconnaissan
1922
+ reconnaissance
1923
+ reconnexion
1924
+ reconésonce
1925
+ reconéssan
1926
+ redré
1927
+ regale
1928
+ regar
1929
+ regarde
1930
+ regaregarer
1931
+ regaréregré
1932
+ regran
1933
+ regre
1934
+ regret
1935
+ regrette
1936
+ regrète
1937
+ reite
1938
+ rejeu
1939
+ rejo
1940
+ rejoin
1941
+ reka
1942
+ rekal
1943
+ rekokannaissa
1944
+ rekonésene
1945
+ rekonésense
1946
+ rekonéssance
1947
+ rel
1948
+ rembage
1949
+ remplèmeu
1950
+ renbage
1951
+ rengal
1952
+ renije
1953
+ renjo
1954
+ reno
1955
+ renéssance
1956
+ rep
1957
+ repli
1958
+ repti
1959
+ reptil
1960
+ reptile
1961
+ reri
1962
+ reuf
1963
+ reuil
1964
+ reul
1965
+ reupti
1966
+ reux
1967
+ rex
1968
+ reyeu
1969
+ rf
1970
+ ri
1971
+ riri
1972
+ riss
1973
+ rix
1974
+ rkkacrane
1975
+ ro
1976
+ robac
1977
+ robage
1978
+ rochon
1979
+ rof
1980
+ roglé
1981
+ rogré
1982
+ roille
1983
+ rojo
1984
+ rombage
1985
+ rombague
1986
+ rombbbage
1987
+ romebage
1988
+ ron
1989
+ ronb
1990
+ ronba
1991
+ ronbache
1992
+ ronbageu
1993
+ ronbague
1994
+ rondage
1995
+ rongajeu
1996
+ ronge
1997
+ ronje
1998
+ ronjeau
1999
+ ronjer
2000
+ ronjeu
2001
+ ronjeur
2002
+ ronjronjo
2003
+ ronpajeu
2004
+ rorcheustre
2005
+ rore
2006
+ rorozié
2007
+ rosier
2008
+ rossier
2009
+ rossié
2010
+ roujo
2011
+ rouondin
2012
+ rozer
2013
+ rrarrari
2014
+ rrerei
2015
+ rreu
2016
+ rron
2017
+ rréégl
2018
+ ru
2019
+ ruconnaissant
2020
+ rueil
2021
+ ruelle
2022
+ rugite
2023
+ rui
2024
+ ruil
2025
+ ruit
2026
+ ruite
2027
+ rupitile
2028
+ rute
2029
+ ruyi
2030
+ rège
2031
+ règle
2032
+
2033
+ récal
2034
+ récit
2035
+ récite
2036
+ récitte
2037
+ réclamation
2038
+ réconsens
2039
+ réconéssanste
2040
+ rédale
2041
+ rég
2042
+ régal
2043
+ régala
2044
+ régale
2045
+ régla
2046
+ réglamation
2047
+ régol
2048
+ régrette
2049
+ régrè
2050
+ régré
2051
+ réil
2052
+ réiu
2053
+ réjen
2054
+ rékal
2055
+ rékalassion
2056
+ rékaréklamassion
2057
+ réki
2058
+ réklam
2059
+ réklamass
2060
+ rékonéssense
2061
+ rékré
2062
+ réksi
2063
+ rémé
2064
+ répiptil
2065
+ réptileu
2066
+ réptimblje
2067
+ réregré
2068
+ rérenjjo
2069
+ réréssi
2070
+ réssite
2071
+ rété
2072
+ s
2073
+ sa
2074
+ saison
2075
+ saleur
2076
+ salon
2077
+ salope
2078
+ salor
2079
+ san
2080
+ sanson
2081
+ sasaison
2082
+ satte
2083
+ scass
2084
+ sco
2085
+ se
2086
+ secret
2087
+ sekelié
2088
+ selié
2089
+ sembreu
2090
+ sension
2091
+ sentin
2092
+ sep
2093
+ seppe
2094
+ sept
2095
+ septre
2096
+ sesalade
2097
+ sesèle
2098
+ sette
2099
+ settecr
2100
+ seukrgreu
2101
+ seup
2102
+ seurf
2103
+ seuripeul
2104
+ sgourdin
2105
+ si
2106
+ siason
2107
+ sibomelle
2108
+ side
2109
+ sidomelle
2110
+ sidomesidome
2111
+ sidomène
2112
+ sidoméleu
2113
+ sidonelle
2114
+ sienjejo
2115
+ sieuge
2116
+ sigomeleu
2117
+ siiss
2118
+ sik
2119
+ sinomelle
2120
+ siroi
2121
+ sission
2122
+ situ
2123
+ situsitile
2124
+ six
2125
+ siège
2126
+ siègeu
2127
+ siègne
2128
+ sièrge
2129
+ sié
2130
+ siégeu
2131
+ siésiège
2132
+ skalate
2133
+ skré
2134
+ skèrfe
2135
+ sleu
2136
+ slèfe
2137
+ sléfe
2138
+ so
2139
+ soer
2140
+ soeur
2141
+ soi
2142
+ sonjo
2143
+ sor
2144
+ sorbil
2145
+ sorbileu
2146
+ sorbisorpilé
2147
+ sorpile
2148
+ sorpille
2149
+ sorpilo
2150
+ sorpilé
2151
+ sorpli
2152
+ sorplip
2153
+ sotonne
2154
+ soté
2155
+ souette
2156
+ sousouette
2157
+ spoporpil
2158
+ sps
2159
+ spétte
2160
+ sse
2161
+ sselié
2162
+ ssi
2163
+ ssidomelle
2164
+ ssorpil
2165
+ ssorr
2166
+ sssleffe
2167
+ ssstyle
2168
+ sstyleu
2169
+ ssuf
2170
+ st
2171
+ sta
2172
+ stab
2173
+ stade
2174
+ stadeu
2175
+ stage
2176
+ stand
2177
+ stande
2178
+ star
2179
+ state
2180
+ stin
2181
+ stiten
2182
+ strastastade
2183
+ stress
2184
+ strudemen
2185
+ stsije
2186
+ ststylé
2187
+ sttpan
2188
+ stttyle
2189
+ stuil
2190
+ style
2191
+ styleu
2192
+ stylo
2193
+ su
2194
+ sueur
2195
+ suf
2196
+ sui
2197
+ suirfené
2198
+ suisi
2199
+ suissiné
2200
+ suite
2201
+ sujel
2202
+ suli
2203
+ supo
2204
+ support
2205
+ sureur
2206
+ suzinier
2207
+ sècre
2208
+ sècrè
2209
+ sèpt
2210
+
2211
+ sécré
2212
+ sédomelle
2213
+ sékré
2214
+ sémézon
2215
+ séré
2216
+ sésette
2217
+ séssan
2218
+ sésson
2219
+ sété
2220
+ séège
2221
+ t
2222
+ ta
2223
+ tab
2224
+ taba
2225
+ tabac
2226
+ tabak
2227
+ tablak
2228
+ tableu
2229
+ tabo
2230
+ tajo
2231
+ tak
2232
+ tanbé
2233
+ tanjeau
2234
+ tanjeu
2235
+ tanjeune
2236
+ tanzieu
2237
+ tap
2238
+ tapla
2239
+ tarpardission
2240
+ task
2241
+ tassier
2242
+ tataba
2243
+ tavo
2244
+ tbavo
2245
+ tchi
2246
+ tchiètche
2247
+ tchtui
2248
+ te
2249
+ teije
2250
+ tembé
2251
+ ten
2252
+ tenkssion
2253
+ tenshion
2254
+ tension
2255
+ tenson
2256
+ tente
2257
+ tentension
2258
+ tenteu
2259
+ ter
2260
+ tetisse
2261
+ teur
2262
+ tevu
2263
+ ti
2264
+ tibuné
2265
+ tieux
2266
+ tifo
2267
+ tij
2268
+ tikre
2269
+ tilieu
2270
+ timbe
2271
+ timbre
2272
+ timbreu
2273
+ time
2274
+ timebe
2275
+ timebre
2276
+ timebuné
2277
+ timepinminé
2278
+ timepinpuné
2279
+ timepune
2280
+ timepuné
2281
+ timetimbre
2282
+ timponé
2283
+ timpunet
2284
+ timpunette
2285
+ timpur
2286
+ tin
2287
+ tinjo
2288
+ tinpulé
2289
+ tinpune
2290
+ tinpunette
2291
+ tinsio
2292
+ tinsion
2293
+ tinssion
2294
+ tinte
2295
+ tipil
2296
+ tipinpune
2297
+ tipune
2298
+ tipunette
2299
+ tirl
2300
+ tite
2301
+ titinpuné
2302
+ titivo
2303
+ titjigacèle
2304
+ tive
2305
+ tiveau
2306
+ tiveo
2307
+ tiveu
2308
+ tivévé
2309
+ tiz
2310
+ tiège
2311
+ tiègre
2312
+ tière
2313
+ tié
2314
+ tiégre
2315
+ tiégue
2316
+ toi
2317
+ toir
2318
+ toire
2319
+ toit
2320
+ toite
2321
+ ton
2322
+ tonbage
2323
+ tonbé
2324
+ tonde
2325
+ tondonté
2326
+ tondé
2327
+ tonjo
2328
+ tonjoruiyé
2329
+ tonte
2330
+ tonté
2331
+ tonvaléscence
2332
+ top
2333
+ toudé
2334
+ toulotte
2335
+ tovo
2336
+ tozion
2337
+ tr
2338
+ trabition
2339
+ tradeu
2340
+ traditien
2341
+ tradition
2342
+ traditon
2343
+ traditsien
2344
+ traditssion
2345
+ tradjission
2346
+ train
2347
+ trank
2348
+ trapi
2349
+ tre
2350
+ trefon
2351
+ trefone
2352
+ trefonet
2353
+ trefonne
2354
+ trevoné
2355
+ tribe
2356
+ trime
2357
+ trin
2358
+ trinbe
2359
+ trindission
2360
+ trié
2361
+ trobo
2362
+ trofeneu
2363
+ troi
2364
+ troir
2365
+ tronc
2366
+ tronfondulence
2367
+ tronk
2368
+ trtradission
2369
+ trtréfoné
2370
+ tru
2371
+ trufodulence
2372
+ trufon
2373
+ trufondelence
2374
+ trufondulen
2375
+ trufondulence
2376
+ trufondulenze
2377
+ trufondulsen
2378
+ trulèbe
2379
+ trulème
2380
+ trulé
2381
+ trèbe
2382
+ trèbeu
2383
+ trège
2384
+ trème
2385
+ trèmejol
2386
+ trèmeu
2387
+ trèp
2388
+ trètrème
2389
+ trève
2390
+ trèème
2391
+ tré
2392
+ trébe
2393
+ trébeu
2394
+ trébi
2395
+ trébo
2396
+ trébé
2397
+ tréchfoné
2398
+ trédission
2399
+ tréfondé
2400
+ tréfoué
2401
+ trémé
2402
+ trénte
2403
+ trépe
2404
+ trétraire
2405
+ tsepé
2406
+ tstimbre
2407
+ ttrifudulence
2408
+ ttrotrefeufoé
2409
+ tu
2410
+ tudisse
2411
+ tufondusse
2412
+ tuie
2413
+ tuil
2414
+ tuile
2415
+ tuit
2416
+ tuite
2417
+ tuji
2418
+ tujil
2419
+ tulème
2420
+ tulémeu
2421
+ tumon
2422
+ tupeur
2423
+ tupune
2424
+ tur
2425
+ turfontulen
2426
+ turleme
2427
+ turlèlme
2428
+ turlème
2429
+ turlèvme
2430
+ turte
2431
+ tut
2432
+ tute
2433
+ tutisse
2434
+ tuve
2435
+ tuèl
2436
+
2437
+ tébré
2438
+ tégacelle
2439
+ téjé
2440
+ téligence
2441
+ témpuné
2442
+ témé
2443
+ térpin
2444
+ téré
2445
+ u
2446
+ un
2447
+ upeur
2448
+ upr
2449
+ upré
2450
+ upér
2451
+ utéligen
2452
+ vagen
2453
+ vagin
2454
+ vakan
2455
+ val
2456
+ vale
2457
+ valeor
2458
+ valet
2459
+ valette
2460
+ valeur
2461
+ valvoleur
2462
+ valéintan
2463
+ vaçade
2464
+ ven
2465
+ vendre
2466
+ venjo
2467
+ venleur
2468
+ vent
2469
+ vente
2470
+ venteu
2471
+ ventre
2472
+ vi
2473
+ vidange
2474
+ vindeu
2475
+ vingt
2476
+ vingte
2477
+ vinte
2478
+ vite
2479
+ vitive
2480
+ vitivo
2481
+ vive
2482
+ vivo
2483
+ vo
2484
+ voileur
2485
+ voir
2486
+ voix
2487
+ voleur
2488
+ voleureu
2489
+ volo
2490
+ volé
2491
+ vor
2492
+ vot
2493
+ vou
2494
+ vvaleur
2495
+ vvente
2496
+ vvoleur
2497
+ ye
2498
+ zeu
2499
+ zeusse
2500
+ zeux
2501
+ zezeu
2502
+ zezu
2503
+ zidolmelle
2504
+ zieu
2505
+ zigo
2506
+ ziège
2507
+ zor
2508
+ zorkassion
2509
+ zouinezozzou
2510
+ zu
2511
+ zuin
2512
+
2513
+  lieu
2514
+ écal
2515
+ écapade
2516
+ écho
2517
+ éclalope
2518
+ écouteur
2519
+ écro
2520
+ écu
2521
+ écuirékouère
2522
+ écuière
2523
+ écureuil
2524
+ écurieère
2525
+ écuririe
2526
+ écuyière
2527
+ écuyère
2528
+ éeu
2529
+ églaminssion
2530
+ égro
2531
+ éguillèreu
2532
+ éguière
2533
+ égzékssitassion
2534
+ éka
2535
+ ékabade
2536
+ ékadteur
2537
+ ékajade
2538
+ ékakeur
2539
+ ékalade
2540
+ ékalajade
2541
+ ékalope
2542
+ ékapadeu
2543
+ ékart
2544
+ ékarteur
2545
+ ékateu
2546
+ ékateur
2547
+ ékaékateur
2548
+ ékaéquaékaéquateur
2549
+ éke
2550
+ ékitassion
2551
+ ékkitation
2552
+ ékosse
2553
+ ékouteur
2554
+ ékrkro
2555
+ ékro
2556
+ ékrok
2557
+ éksitass
2558
+ ékstaze
2559
+ ékuière
2560
+ ékuiécureuil
2561
+ ékukuiyère
2562
+ ékunteur
2563
+ ékurié
2564
+ ékurékuiéyère
2565
+ ékuyère
2566
+ ékuékuiyère
2567
+ élieur
2568
+ élou
2569
+ élève
2570
+ élévemen
2571
+ éléveu
2572
+ épeur
2573
+ épogneu
2574
+ épozission
2575
+ épozition
2576
+ épozizion
2577
+ éra
2578
+ éragon
2579
+ és
2580
+ ésalope
2581
+ ésalopeu
2582
+ éscalope
2583
+ éscor
2584
+ éscrotke
2585
+ ésgapade
2586
+ ésita
2587
+ éska
2588
+ éskalaéskalope
2589
+ éskaléskalade
2590
+ éskapadeu
2591
+ éske
2592
+ éskor
2593
+ éskork
2594
+ éskrok
2595
+ éskrosse
2596
+ éskrégon
2597
+ éssaescalade
2598
+ éssaééskapade
2599
+ éssitassion
2600
+ éssitation
2601
+ éssssitation
2602
+ ésstringon
2603
+ ésséyer
2604
+ éstragnon
2605
+ éstraon
2606
+ éstrengon
2607
+ éstringongon
2608
+ éséskalade
2609
+ éséskapade
2610
+ éséstragon
2611
+ étage
2612
+ étar
2613
+ étassion
2614
+ étor
2615
+ étra
2616
+ étragon
2617
+ étrajon
2618
+ étrangean
2619
+ étraon
2620
+ étrayon
2621
+ étél
2622
+ étéligen
2623
+ étér
2624
+ ététeur
2625
+ évou
2626
+ éékalopeu
2627
+ éékapate
2628
+ ééskalope
2629
+ ééteur
2630
+ ôte
log_mozilla-foundation_common_voice_8_0_fr_test_predictions.txt ADDED
The diff for this file is too large to render. See raw diff
 
log_mozilla-foundation_common_voice_8_0_fr_test_predictions_greedy.txt ADDED
The diff for this file is too large to render. See raw diff
 
log_mozilla-foundation_common_voice_8_0_fr_test_targets.txt ADDED
The diff for this file is too large to render. See raw diff
 
log_mozilla-foundation_common_voice_8_0_fr_test_targets_greedy.txt ADDED
The diff for this file is too large to render. See raw diff
 
log_speech-recognition-community-v2_dev_data_fr_validation_predictions.txt ADDED
The diff for this file is too large to render. See raw diff
 
log_speech-recognition-community-v2_dev_data_fr_validation_predictions_greedy.txt ADDED
The diff for this file is too large to render. See raw diff
 
log_speech-recognition-community-v2_dev_data_fr_validation_targets.txt ADDED
The diff for this file is too large to render. See raw diff
 
mozilla-foundation_common_voice_8_0_fr_test_eval_results.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ WER: 0.16320660093488012
2
+ CER: 0.04213180710602369
mozilla-foundation_common_voice_8_0_fr_test_eval_results_greedy.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ WER: 0.168549674179772
2
+ CER: 0.046693488978296595
preprocessor_config.json ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "do_normalize": true,
3
+ "feature_extractor_type": "Wav2Vec2FeatureExtractor",
4
+ "feature_size": 1,
5
+ "padding_side": "right",
6
+ "padding_value": 0,
7
+ "processor_class": "Wav2Vec2ProcessorWithLM",
8
+ "return_attention_mask": true,
9
+ "sampling_rate": 16000
10
+ }
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c526b57c0fa8c775ae10130211e8e6ea900c5c3b89e10ad13651f2c35326a482
3
+ size 3850553521
special_tokens_map.json ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": "<s>",
3
+ "eos_token": "</s>",
4
+ "pad_token": "<pad>",
5
+ "unk_token": "<unk>"
6
+ }
speech-recognition-community-v2_dev_data_fr_validation_eval_results.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ WER: 0.1716189447145687
2
+ CER: 0.09386097249622839
speech-recognition-community-v2_dev_data_fr_validation_eval_results_greedy.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ WER: 0.22343778137943454
2
+ CER: 0.09883563498510696
tokenizer_config.json ADDED
@@ -0,0 +1,48 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "added_tokens_decoder": {
3
+ "0": {
4
+ "content": "<pad>",
5
+ "lstrip": true,
6
+ "normalized": false,
7
+ "rstrip": true,
8
+ "single_word": false,
9
+ "special": false
10
+ },
11
+ "1": {
12
+ "content": "<s>",
13
+ "lstrip": true,
14
+ "normalized": false,
15
+ "rstrip": true,
16
+ "single_word": false,
17
+ "special": false
18
+ },
19
+ "2": {
20
+ "content": "</s>",
21
+ "lstrip": true,
22
+ "normalized": false,
23
+ "rstrip": true,
24
+ "single_word": false,
25
+ "special": false
26
+ },
27
+ "3": {
28
+ "content": "<unk>",
29
+ "lstrip": true,
30
+ "normalized": false,
31
+ "rstrip": true,
32
+ "single_word": false,
33
+ "special": false
34
+ }
35
+ },
36
+ "bos_token": "<s>",
37
+ "clean_up_tokenization_spaces": true,
38
+ "do_lower_case": false,
39
+ "eos_token": "</s>",
40
+ "model_max_length": 1000000000000000019884624838656,
41
+ "pad_token": "<pad>",
42
+ "processor_class": "Wav2Vec2ProcessorWithLM",
43
+ "replace_word_delimiter_char": " ",
44
+ "target_lang": null,
45
+ "tokenizer_class": "Wav2Vec2CTCTokenizer",
46
+ "unk_token": "<unk>",
47
+ "word_delimiter_token": "|"
48
+ }
vocab.json ADDED
@@ -0,0 +1,49 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "'": 5,
3
+ "-": 6,
4
+ "</s>": 2,
5
+ "<pad>": 0,
6
+ "<s>": 1,
7
+ "<unk>": 3,
8
+ "a": 7,
9
+ "b": 8,
10
+ "c": 9,
11
+ "d": 10,
12
+ "e": 11,
13
+ "f": 12,
14
+ "g": 13,
15
+ "h": 14,
16
+ "i": 15,
17
+ "j": 16,
18
+ "k": 17,
19
+ "l": 18,
20
+ "m": 19,
21
+ "n": 20,
22
+ "o": 21,
23
+ "p": 22,
24
+ "q": 23,
25
+ "r": 24,
26
+ "s": 25,
27
+ "t": 26,
28
+ "u": 27,
29
+ "v": 28,
30
+ "w": 29,
31
+ "x": 30,
32
+ "y": 31,
33
+ "z": 32,
34
+ "|": 4,
35
+ "à": 33,
36
+ "â": 34,
37
+ "ã": 35,
38
+ "ç": 36,
39
+ "è": 37,
40
+ "é": 38,
41
+ "ê": 39,
42
+ "ë": 40,
43
+ "î": 41,
44
+ "ï": 42,
45
+ "ô": 43,
46
+ "ù": 44,
47
+ "û": 45,
48
+ "œ": 46
49
+ }