joaoalvarenga committed on
Commit
2c9efbe
1 Parent(s): fc61f67

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +5 -5
README.md CHANGED
@@ -49,8 +49,8 @@ from transformers import Wav2Vec2ForCTC, Wav2Vec2Processor
49
 
50
  test_dataset = load_dataset("common_voice", "pt", split="test[:2%]")
51
 
52
- processor = Wav2Vec2Processor.from_pretrained("joorock12/wav2vec2-large-xlsr-53-portuguese")
53
- model = Wav2Vec2ForCTC.from_pretrained("joorock12/wav2vec2-large-xlsr-53-portuguese")
54
 
55
  resampler = torchaudio.transforms.Resample(48_000, 16_000)
56
 
@@ -89,11 +89,11 @@ import re
89
  test_dataset = load_dataset("common_voice", "pt", split="test")
90
  wer = load_metric("wer")
91
 
92
- processor = Wav2Vec2Processor.from_pretrained("joorock12/wav2vec2-large-xlsr-53-portuguese")
93
- model = Wav2Vec2ForCTC.from_pretrained("joorock12/wav2vec2-large-xlsr-53-portuguese")
94
  model.to("cuda")
95
 
96
- chars_to_ignore_regex = '[\\\\,\\\\?\\\\.\\\\!\\\\-\\\\;\\\\:\\\\"\\\\“]'
97
  resampler = torchaudio.transforms.Resample(48_000, 16_000)
98
 
99
  # Preprocessing the datasets.
 
49
 
50
  test_dataset = load_dataset("common_voice", "pt", split="test[:2%]")
51
 
52
+ processor = Wav2Vec2Processor.from_pretrained("joorock12/wav2vec2-large-xlsr-portuguese")
53
+ model = Wav2Vec2ForCTC.from_pretrained("joorock12/wav2vec2-large-xlsr-portuguese")
54
 
55
  resampler = torchaudio.transforms.Resample(48_000, 16_000)
56
 
 
89
  test_dataset = load_dataset("common_voice", "pt", split="test")
90
  wer = load_metric("wer")
91
 
92
+ processor = Wav2Vec2Processor.from_pretrained("joorock12/wav2vec2-large-xlsr-portuguese")
93
+ model = Wav2Vec2ForCTC.from_pretrained("joorock12/wav2vec2-large-xlsr-portuguese")
94
  model.to("cuda")
95
 
96
+ chars_to_ignore_regex = '[\,\?\.\!\-\;\:\"\“\'\�]'
97
  resampler = torchaudio.transforms.Resample(48_000, 16_000)
98
 
99
  # Preprocessing the datasets.